diff --git a/tests/expected-results-edgy/blast.csv b/tests/expected-results-edgy/blast.csv index ebf15eb..5b79afd 100644 --- a/tests/expected-results-edgy/blast.csv +++ b/tests/expected-results-edgy/blast.csv @@ -1,7 +1,7 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,9719,1,9718,1,9719,0.0,13866,99.949,9714,plus,5770-T291TC2358CTCA743GA552 -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,634,1,634,9086,9719,0.0,885,98.738,626,plus,23CA83AG55GT3TA7AG5CT44AG63AG343 -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,634,9085,9718,1,634,0.0,882,98.580,625,plus,23AC57GA25GA55TG3AT7GA5TC44GA63GA343 -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,9719,1,9718,9719,1,0.0,13866,99.949,9714,minus,552CT743GTGA2358AG291-A5770 -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,634,9085,9718,9719,9086,0.0,885,98.738,626,minus,343TC63TC44GA5TC7AT3CA55TC83GT23 -Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9719,634,1,634,634,1,0.0,882,98.580,625,minus,343CT63CT44AG5CT7TA3AC55CT25CT57TG23 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,9718,1,9718,1,9718,0.0,13882,100.000,9718,plus,9718 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,634,9085,9718,1,634,0.0,882,98.580,625,plus,23AC57GA25GA55TG3AT7GA5TC44GA63GA343 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,634,1,634,9085,9718,0.0,882,98.580,625,plus,23CA57AG25AG55GT3TA7AG5CT44AG63AG343 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,9718,1,9718,9718,1,0.0,13882,100.000,9718,minus,9718 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,634,1,634,634,1,0.0,882,98.580,625,minus,343CT63CT44AG5CT7TA3AC55CT25CT57TG23 +Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9718,9718,634,9085,9718,9718,9085,0.0,882,98.580,625,minus,343TC63TC44GA5TC7AT3CA55TC25TC57GT23 diff --git a/tests/expected-results-edgy/errors.json b/tests/expected-results-edgy/errors.json index 3c02a75..79f9a33 100644 --- a/tests/expected-results-edgy/errors.json +++ b/tests/expected-results-edgy/errors.json @@ -1,26 +1,4 @@ { - "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455": [ - { - "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" - } - ], - "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED": [ - { - "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED [REVERSED]", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED [REVERSED]", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" - } - ] + "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455": [], + "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED": [] } \ No newline at end of file diff --git a/tests/expected-results-edgy/holistic.json b/tests/expected-results-edgy/holistic.json index 27cb729..5006171 100644 --- a/tests/expected-results-edgy/holistic.json +++ b/tests/expected-results-edgy/holistic.json @@ -4,11 +4,11 @@ "hypermutation_probablility": 0.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9718, - "blast_sseq_coverage": 1.1304660973351168, + "blast_sseq_coverage": 1.130479522535501, "blast_qseq_coverage": 1.130479522535501, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED": { @@ -16,11 +16,11 @@ "hypermutation_probablility": 0.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9718, - "blast_sseq_coverage": 1.1304660973351168, + "blast_sseq_coverage": 1.130479522535501, "blast_qseq_coverage": 1.130479522535501, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-edgy/intact.fasta b/tests/expected-results-edgy/intact.fasta index e69de29..8ed7374 100644 --- a/tests/expected-results-edgy/intact.fasta +++ b/tests/expected-results-edgy/intact.fasta @@ -0,0 +1,326 @@ +>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455 +TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA +CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC +TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA +ACAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCGG +AGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAG +AGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCG +CTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGAT +CCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +GCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +TGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTC +AGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAG +CGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGG +CAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGA +AGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAA +AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCA +AGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGT +AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCA +TTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACC +AAGGAAGCTTTAGACAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAA +GCAGCAGCTGACACAGGACACAGCAATCAGGTCAGCCAAAATTACCCTATAGTGCAGAAC +ATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAA +GTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTGATACCCATGTTTTCAGCATTATCAGAA +GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCC +ATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCA +GTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCA +GGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCA +GTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTAT +AGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTA +GACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG +ACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTG +GGACCAGCGGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGC +CATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATG +ATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAA +GAAGGGCACACAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGA +AAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATC +TGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCC +CCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCCCTCAGAAGCAGGAG +CCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGGTCACTCTTTGGCAACGACCCC +TCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATG +ATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAA +TTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATA +AAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGT +TGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGCCCTATTGAGACTGTACCAGTAA +AATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAA +TAAAAGCATTAGTAGAAATTTGTACAGAGATGGAAAAGGAAGGGAAAATTTCAAAAATTG +GGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAAT +GGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTC +AATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATG +TGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTA +CCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCAC +AGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTT +TTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGAT +CTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGA +GGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGG +GTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACA +GCTGGACTGTCAATGACATACAGAAGTTAGTGGGGAAATTGAATTGGGCAAGTCAGATTT +ACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAG +AAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAA +AAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGA +AGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAA +CAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGG +CAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAAC +TGCCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGA +TTCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGA +AAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTA +AATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCACCCTAACTG +ACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGAT +TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG +ATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGG +TCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAAT +TAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATG +AACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTG +TAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGC +ATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAA +AAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAG +CAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAA +AAACAATACATACTGACAATGGCAGCAATTTCACCGGTGCTACGGTTAGGGCCGCCTGTT +GGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAG +TAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAAC +ATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGA +TTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTA +AAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCA +GAAATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAA +TACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATT +ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACA +TGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTAT +AGACATCACTATGAAAGCCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGG +GATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCAT +TTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCT +GAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATA +AGAAAGGCCTTATTAGGACACATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAAC +AAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAG +CCACCTTTGCCTAGTGTTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACC +AAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGA +ATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATG +AAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGC +TGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGA +GAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAG +CCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGT +TTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGA +GCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTA +ATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATA +GTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGAC +AGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAA +ATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGAT +GATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAA +GGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACA +TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATT +GGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGA +GGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG +TGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAG +AATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAG +AGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAA +TGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCC +AAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCT +AAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACA +ATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGC +AGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGT +ACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAG +AATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATAT +GAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGC +TAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGG +AGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAA +TTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAA +TAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACAT +GTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTC +ATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGA +GATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATA +TAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGT +GCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGC +AGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTC +TGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTT +GCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATA +CCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCAC +TGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACAC +GACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAAT +TGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATG +GGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCAT +AATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAA +TAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGG +ACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAT +TCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTT +CAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGG +ACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGA +ACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGAC +AGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAG +AATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTA +GTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATA +GGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAG +CAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTC +CAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCC +ACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATA +TCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACAC +CAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTG +AGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGA +GCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCC +TAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATC +GAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGA +CTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG +TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTG +CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT +GACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA +>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED +TGCTAGAGATTTTCCACACTGACTAAAAGGGTCTGAGGGATCTCTAGTTACCAGAGTCAC +ACAACAGACGGGCACACACTACTTGAAGCACTCAAGGCAAGCTTTATTGAGGCTTAAGCA +GTGGGTTCCCTAGTTAGCCAGAGAGCTCCCAGGCTCAGATCTGGTCTAACCAGAGAGACC +CAGTACAGGCAAAAAGCAGCTGCTTATATGCAGGATCTGAGGGCTCGCCACTCCCCAGTC +CCGCCCAGGCCACGCCTCCCTGGAAAGTCCCCAGCGGAAAGTCCCTTGTAGCAAGCTCGA +TGTCAGCAGTTCTTGAAGTACTCCGGATGCAGCTCTCGGGCCACGTGATGAAATGCTAGG +CGGCTGTCAAACCTCCACTCTAACACTTCTCTCTCCGGGTCATCCATCCCATGCAGGCTC +ACAGGGTGTAACAAGCTGGTGTTCTCTCCTTTATTGGCCTCTTCTATCTTATCTGGCTCA +ACTGGTACTAGCTTGTAGCACCATCCAAAGGTCAGTGGATATCTGACCCCTGGCCCTGGT +GTGTAGTTCTGCCAATCAGGGAAGTAGCCTTGTGTGTGGTAGATCCACAGATCAAGGATA +TCTTGTCTTCTTTGGGAGTGAATTAGCCCTTCCAGTCCCCCCTTTTCTTTTAAAAAGTGG +CTAAGATCTACAGCTGCCTTGTAAGTCATTGGTCTTAAAGGTACCTGAGGTGTGACTGGA +AAACCCACCTCCTCCTCCTCTTGTGCTTCTAGCCAGGCACAAGCAGCATTGGTAGCTGCT +GTATTGCTACTTGTGATTGCTCCATGTTTTTCCAGGTCTCGAGATGCTGCTCCCACCCTA +TCTGCTGCTGGCTCAGCTCGTCTCATTCTTTCCCTTACAGTAGGCCATCCAATCACACTA +CTTTTTGACCACTTGCCACCCATCTTATAGCAAAATCCTTTCCAAGCCCTGTCTTATTCT +TCTAGGTATGTGGCGAATAGCTCTACAAGCTCCTTGTACTACTTCTATAACCCTATCTGT +CCCCTCAGCTACTGCTATGGCTGTGGCATTGAGCAAGCTAACAGCACTATTCTTTAGTTC +CTGACTCCAATACTGTAGGAGATTCCACCAATATTTGAGGGCTTCCCACCCCCTGCGTCC +CAGAAGTTCCACAATCCTCGTTACAATCAAGAGTAAGTCTCTCAAGCGGTGGTAGCTGAA +GAGGCACAGGCTCCGCAGATCGTCCCAGATAAGTGCCAAGGATCCGTTCACTAATCGAAT +GGATCTGTCTCTGTCTCTCTCTCCACCTTCTTCTTCGGTTCCTTCGGGCCTGTCGGGTCC +CCTCGGGGTTGGGAGGTGGGTCTGAAACGATAATGGTGAATATCCCTGCCTAACTCTATT +CACTATAGAAAGTACAGCAAAAACTATTCTTAAACCTACCAAGCCTCCTACTATCATTAT +GAATAATTTTATATACCACAGCCAATTTGTTATGTTAAACCAATTCCACAAACTTGCCCA +TTTATCTAATTCCAATAATTCTTGTTCATTCTTTTCTTGCTGGTTTTGCGATTCTTCAAT +TAAGGAGTGTATTAAGCTTGTGTAATTGTTAATTTCTCTGTCCCACTCCATCCAGGTCGT +GTGATTCCAAATCTGTTCCAGAGATTTATTACTCCAACTAGCATTCCAAGGCACAGCAGT +GGTGCAAATGAGTTTTCCAGAGCAACCCCAAATCCCCAGGAGCTGTTGATCCTTTAGGTA +TCTTTCCACAGCCAGGATTCTTGCCTGGAGCTGCTTGATGCCCCAGACTGTGAGTTGCAA +CAGATGCTGTTGCGCCTCAATAGCCCTCAGCAAATTGTTCTGCTGCTGCACTATACCAGA +CAATAATTGTCTGGCCTGTACCGTCAGCGTCATTGAGGCTGCGCCCATAGTGCTTCCTGC +TGCTCCCAAGAACCCAAGGAACAAAGCTCCTATTCCCACTGCTCTTTTTTCTCTCTGCAC +CACTCTTCTCTTTGCCTTGGTGGGTGCTACTCCTAATGGTTCAATTTTTACTACTTTATA +TTTATATAATTCACTTCTCCAATTGTCCCTCATATCTCCTCCTCCAGGTCTGAAGATCTC +GGACTCATTGTTGCTATTACCACCATCTCTTGTTAATAGCAGCCCTGTAATATTTGATGA +ACATCTAATTTGTCCACTGATGGGAGGGGCATACATTGCTTTTCCTACTTTCTGCCACAT +GTTTATAATTTGTTTTATTCTGCATGGGAGGGTGATTGTGTCACTTCCTTCAGTGTTATT +TGACCCTTCAGTACTCCAAGTACTATTAAACCAAGTACTATTAAACAGTTGTGTTGAATT +ACAGTAGAAAAATTCCCCTCCACAATTAAAACTGTGCGTTACAATTTCTGGGTCCCCTCC +TGAGGATTGCTTAAAGATTATTGTTTTATTATTTCCAAATTGTTCTCTTAATTTGCTAGC +TATCTGTTTTAAAGTGTTATTCCATTTTGCTCTACTAATGTTACAATGTGCTTGTCTCAT +ATTTCCTATTTTTCCTATTGTAACAAATGCTCTCCCTGGTCCTCTCTGGATACGGATTCT +TTTTCTTGTATTGTTGTTGGGTCTTGTACAATTAATTTCTACAGATGTGTTCAGCTGTAC +TATTATGGTTTTAGCATTGTCCGTGAAATTGACAGATCTAATTACTACCTCTTCTTCTGC +TAGACTGCCATTTAACAGCAGTTGAGTTGATACTACTGGCCTAATTCCATGTGTACATTG +TACTGTGCTGACATTTGTACATGGTCCTGTTCCATTGAACGTCTTATTATTACATTTTAG +AATCGCAAAACCAGCCGGGGCACAATAATGTATGGGAATTGGCTCAAAGGATACCTTTGG +ACAGGCCTGTGTAATGACTGAGGTGTTACAACTTGTCAACTTATAGCTGGTAGTATCATT +ATCTATTGGTATTATATCAAGTTTATAAAAAAATGCATATTCTTTCTGCACCTTACCTCT +TATGCTTGTGCTGATATTGAAAGAGCAGTTTTTTATCTCTCCTTTCTCCATTATCATTCT +CCCGCTACTACTATTGGTATTAGTATCATTCTTCAAATCAGTGCACTTTAAACTAACACA +GAGTGGGGTTAATTTTACACATGGCTTTAGGCTTTGATCCCATAAACTGATTATATCCTC +ATGCATCTGTTCTACCATGTCATTTTTCCACATGTTAAAATTTTCTGTCACATTTACCAA +TACTACTTCTTGTGGGTTGGGGTCTGTGGGTACACAGGCATGTGTGGCCCAAACATTATG +TACCTCTGTATCATATGCTTTAGCATCTGATGCACAAAATAGAGTGGTGGTTGCTTCCTT +CCACACAGGTACCCCATAATAGACTGTGACCCACAATTTTTCTGTAGCACTACAGATCAT +CAACATCCCAAGGAGCATGGTGCCCCATCTCCACCCCCATCTCCACAAGTGCTGATATTT +CTCCTTCACTCTCATTGCCACTGTCTTCTGCTCTTTCTATTAGTCTATCAATTAACCTGT +CTATTTTTCTTTGTCTTAATATTTTCCTATATTCTATGATTACTATGGACCACACAACTA +TTGCTATTATTATTGCTACTACTAATGCTACTATTGCTACTATTGGTATAGGTTGCATTA +CATGTACTACTTACTGCTTTGATAGAGAAGCTTGATGAGTCTGACTGTTCTGATGAGCTC +TTCGTCGCTGTCTCCGCTTCTTCCTGCCATAGGAGATGCCTAAGGCTTTTGTTATGAAAC +AAACTTGGCAATGAAAGCAACACTTTTTACAATAGCAATTGGTACAAGCAGTTTTAGGCT +GACTTCCTGGATGCTTCCAGGGCTCTAGTCTAGGATCTACTGGCTCCATTTCTTGCTCTC +CTCTGTCGAGTAACGCCTATTCTGCTATGTCGACACCCAATTCTGAAATGGATAAACAGC +AGTTGTTGCAGAATTCTTATTATGGCTTCCACTCCTGCCCAAGTATCCCCATAAGTTTCA +TAGATATGTTGCCCTAAGCCATGGAGCCAAATCCTAGGAAAATGTCTAACAGCTTCATTC +TTAAGCTCCTCTAAAAGCTCTAGTGTCCATTCATTGTGTGGCTCCCTCTGTGGCCCTTGG +TCTTCTGGGGCTTGTTCCATCTATCCTCTGTCAGTTTCGTAACACTAGGCAAAGGTGGCT +TTATCTTTTTTGGTGTTATTAATGCTGCTAGTGCCAAGTATTGTAGAGATCCTACCTTGT +TATGTCCTGCTTGATATTCACACCTAGGGCTAACTATGTGTCCTAATAAGGCCTTTCTTA +TAGCAGAGTCTGAAAAACAGTCAAAGTAATACAGATGAATTAGTTGGTCTGCTAGTTCAG +GGTCTACTTGTGTGCTATATCTCTTTTTCCTCCATTCTATGGAGACTCCCTGACCCAAAT +GCCAGTCTCTTTCTCCTGTATGCAGACCCCAATATGTTGTTATTACCAATCTAGCATCCC +CTAGTGGGATGTGTACTTCTGAACTTATTCTTGGATGAGGGCTTTCATAGTGATGTCTAT +AAAACCATCCCCTAGCTTTCCCTGAAACATACATATGGTGTTTTACTAAACTTTTCCATG +TTCTAATCCTCATCCTGTCTACTTGCCACACAATCATCACCTGCCATCTGTTTTCCATAA +TCCCTAATGATCTTTGCTTTTCTTCTTGGCACTACTTTTATGTCACTATTATCTTGTATT +ACTACTGCCCCTTCACCTTTCCAGAGGAGCTTTGCTGGTCCTTTCCAAAGTGGATTTCTG +CTGTCCCTGTAATAAACCCGAAAATTTTGAATTTTTGTAATTTGTTTTTGTAATTCTTTA +GTTTGTATGTCTGTTGCTATTATGTCTACTATTCTTTCCCCTGCACTGTACCCCCCAATC +CCCCCTTTTCTTTTAAAATTGTGGATGAATACTGCCATTTGTACTGCTGTCTTAAGATGT +TCAGCCTGATCTCTTACCTGTCCTATAATTTTCTTTAATTCTTTATTCATAGATTCTACT +ACTCCTTGACTTTGGGGATTGTAGGGAATTCCAAATTCCTGCTTGATTCCCGCCCACCAA +CAGGCGGCCCTAACCGTAGCACCGGTGAAATTGCTGCCATTGTCAGTATGTATTGTTTTT +ACTGGCCATCTTCCTGCTAATTTTAAAAGAAAATATGCTGTTTCCTGCCCTGTTTCTGCT +GGAATAACTTCTGCTTCTATATATCCACTGGCTACATGAACTGCTACCAGGATAACTTTT +CCTTCTAAATGTGTACAATCTAGTTGCCATATTCCTGGACTACAGTCTACTTGTCCATGC +ATGGCTTCTCCTTTTAGCTGACATTTATCACAGCTGGCTACTATTTCTTTTGCTACTACA +GGTGGCAGGTTAAAATCACTAGCCATTGCTCTCCAATTACTGTGATATTTCTCATGTTCA +TCTTGGGCCTTATCTATTCCATCTAAAAATAGTACTTTCCTGATTCCAGCACTGACTAAT +TTATCTACTTGTTCATTTCCTCCAATTCCTTTGTGTGCTGGTACCCATGCCAGATAGACC +TTTTCCTTTTTTATTAACTGCTCTATTATTTGATTGACTAACTCTGATTCACTTTGATCT +GGTTGTGCTTGAATGATTCCTAATGCATATTGTGAGTCTGTTACTATGTTTACTTCTAAT +CCCGAATCCTGCAAAGCTAGATAAATTGCTTGTAACTCAGTCTTCTGATTTGTTGTGTCA +GTTAGGGTGACAACTTTTTGTCTTCCTCTATTAGTAACATATCCTGCTTTTCCTAATTTA +GTCTCCCTGTTAGCTGCCCCATCTACATAGAAGGTTTCTGCTCCTACTATGGGTTCTTTC +TCTAACTGGTACCATAATTTCACTAAGGGAGGGGTATTAACAAACTCCCACTCAGGAATC +CAGGTGGCTTGCCAATACTCTGTCCACCATGTTTCCCATGTTTCCTTTTGTATGGGCAGT +TTAAATTTAGGAGTCTTTCCCCATATTACTATGCTTTCTGTGGTTATTTTTTGCACTGCC +TCTGTTAATTGTTTTACATCATTAGTGTGGGCACCCCTCATTCTTGCATATTTTCCTGTT +TTCAGATTTTTAAATGGCTCTTGATAAATTTGATATGTCCATTGGCCTTGCCCCTGCTTC +TGTATTTCTGCTATTAAGTCTTTTGATGGGTCATAATACACTCCATGTACTGGTTCTTTT +AGAATCTCTCTGTTTTCTGCCAGTTCTAGCTCTGCTTCTTCTGTTAGTGGTATTACTTCT +GTTAGTGCTTTGGTTCCTCTAAGGAGTTTACATAATTGCCTTACTTTAATCCCTGGGTAA +ATCTGACTTGCCCAATTCAATTTCCCCACTAACTTCTGTATGTCATTGACAGTCCAGCTG +TCTTTTTCTGGCAGCACTATAGGCTGTACTGTCCATTTATCAGGATGGAGTTCATAACCC +ATCCAAAGGAATGGAGGTTCTTTCTGATGTTTTTTGTCTGGTGTGGTAAGTCCCCACCTC +AACAGATGTTGTCTCAGCTCCTCTATTTTTGTTCTATGCTGCCCTATTTCTAAGTCAGAT +CCTACATACAAATCATCCATGTATTGATAGATAACTATGTCTGGATTTTGTTTTCTAAAA +GGCTCTAAGATTTTTGTCATGCTACTTTGGAATATTGCTGGTGATCCTTTCCATCCCTGT +GGAAGCACATTGTACTGATATCTAATCCCTGGTGTCTCATTGTTTATACTAGGTATGGTA +AATGCAGTATACTTCCTGAAGTCTTCATCTAAGGGAACTGAAAAATATGCATCACCCACA +TCCAGTACTGTTACTGATTTTTTCTTTTTTAACCCTGCGGGATGTGGTATTCCTAATTGA +ACTTCCCAGAAGTCTTGAGTTCTCTTATTAAGTTCTCTGAAATCTACTAATTTTCTCCAT +TTAGTACTGTCTTTTTTCTTTATGGCAAATACTGGAGTATTGTATGGATTTTCAGGCCCA +ATTTTTGAAATTTTCCCTTCCTTTTCCATCTCTGTACAAATTTCTACTAATGCTTTTATT +TTTTCTTCTGTCAATGGCCATTGTTTAACTTTTGGGCCATCCATTCCTGGCTTTAATTTT +ACTGGTACAGTCTCAATAGGGCTAATGGGAAAATTTAAAGTGCAACCAATCTGAGTCAAC +AGATTTCTTCCAATTATGTTGACAGGTGTAGGTCCTACTAATACTGTACCTATAGCTTTA +TGTCCACAGATTTCTATGAGTATCTGATCATACTGTCTTACTTTGATAAAACCTCCAATT +CCCCCTATCATTTTTGGTTTCCATCTTCCTGGCAAACTCATTTCTTCTAATACTGTATCA +TCTGCTCCTGTATCTAATAGAGCTTCCTTTAGTTGCCCCCCTATCTTTATTGTGACGAGG +GGTCGTTGCCAAAGAGTGACCTGAGGGAAGTTAAAGGATACAGTTCCTTGTCTATCGGCT +CCTGCTTCTGAGGGGGAGTTGTTGTCTCTACCCCAGACCTGAAGCTCTCTTCTGGTGGGG +CTGTTGGCTCTGGTCTGCTCTGAAGAAAATTCCCTGGCCTTCCCTTGTAGGAAGGCCAGA +TCTTCCCTAAAAAATTAGCCTGTCTCTCAGTACAATCTTTCATTTGGTGTCCTTCCTTTC +CACATTTCCAACAGCCCTTTTTCCTAGGGGCCCTGCAATTTCTGGCTGTGTGCCCTTCTT +TGCCACAATTGAAACACTTAACAATCTTTCTTTGGTTCCTAAAATTGCCTCTCTGCATCA +TTATGGTAGCTGAATTTGTTACTTGGCTCATTGCTTCAGCCAAAACTCTTGCCTTATGGC +CGGGTCCTCCTACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCCGCTGGTCCCA +ATGCTTTTAAAATAGTCTTACAATCTGGGTTCGCATTTTGGACCAACAAGGTTTCTGTCA +TCCAATTTTTTACCTCCTGTGAAGCTTGCTCGGCTCTTAGAGTTTTATAGAACCGGTCTA +CATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTCTTATGTCCAGAATGCTGGTAGGGCTAT +ACATTCTTACTATTTTATTTAATCCCAGGATTATCCATCTTTTATAAATTTCTCCTACTG +GGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTG +CTATGTCACTTCCCCTTGGTTCTCTCATCTGGCCTGGTGCAATAGGCCCTGCATGCACTG +GATGCACTCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAACATTTGCATGG +CTGCTTGATGTCCCCCCACTGTGTTTAGCATGGTGTTTAAATCTTGTGGGGTGGCTCCTT +CTGATAATGCTGAAAACATGGGTATCACTTCTGGGCTGAAAGCCTTCTCTTCTACTACTT +TTACCCATGCATTTAAAGTTCTAGGTGATATGGCCTGATGTACCATTTGCCCCTGGATGT +TCTGCACTATAGGGTAATTTTGGCTGACCTGATTGCTGTGTCCTGTGTCAGCTGCTGCTT +GCTGTGCTTTTTTCTTACTTTTGTTTTGCTCTTCCTCTATCTTGTCTAAAGCTTCCTTGG +TGTCTTTTATCTCTATCCTTTGATGCACACAATAGAGGGTTGCTACTGTATTATATAATG +ATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTCCCAGTATTTGTCTAC +AGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTG +CCCATACTATATGTTTTAATTTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTTT +CCCATCGATCTAATTCTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTC +TAGCCTCCGCTAGTCAAAATTTTTGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCC +GTGCGCGCTTCAGCAAGCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCCCTTTCGCT +TTCAGGTCCCTGTTCGGGCGCCACTGCTAGAGATTTTCCACACTGACTAAAAGGGTCTGA +GGGATCTCTAGTTACCAGAGTCACACAACAGACGGGCACACACTACTTGAAGCACTCAAG +GCAAGCTTTATTGAGGCTTAAGCAGTGGGTTCCCTAGTTAGCCAGAGAGCTCCCAGGCTC +AGATCTGGTCTAACCAGAGAGACCCAGTACAGGCAAAAAGCAGCTGCTTATATGCAGGAT +CTGAGGGCTCGCCACTCCCCAGTCCCGCCCAGGCCACGCCTCCCTGGAAAGTCCCCAGCG +GAAAGTCCCTTGTAGCAAGCTCGATGTCAGCAGTTCTTGAAGTACTCCGGATGCAGCTCT +CGGGCCATGTGATGAAATGCTAGGCGGCTGTCAAACCTCCACTCTAACACTTCTCTCTCC +GGGTCATCCATTCCATGCAGGCTCACAGGGTGTAACAAGCTGGTGTTCTCTCCTTTGTTG +GCTTCTTCTAACTTCTCTGGCTCAACTGGTACTAGCTTGTAGCACCATCCAAAGGTCAGT +GGATATCTGATCCCTGGCCCTGGTGTGTAGTTCTGCTAATCAGGGAAGTAGCCTTGTGTG +TGGTAGATCCACAGATCAAGGATATCTTGTCTTCGTTGGGAGTGAATTAGCCCTTCCA diff --git a/tests/expected-results-edgy/nonintact.fasta b/tests/expected-results-edgy/nonintact.fasta index 8ed7374..e69de29 100644 --- a/tests/expected-results-edgy/nonintact.fasta +++ b/tests/expected-results-edgy/nonintact.fasta @@ -1,326 +0,0 @@ ->Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455 -TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA -CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC -TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA -ACAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCGG -AGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAG -AGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCG -CTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGAT -CCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA -GCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT -TGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTC -AGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAG -CGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGG -CAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGA -AGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAA -AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCA -AGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGT -AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCA -TTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACC -AAGGAAGCTTTAGACAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAA -GCAGCAGCTGACACAGGACACAGCAATCAGGTCAGCCAAAATTACCCTATAGTGCAGAAC -ATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAA -GTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTGATACCCATGTTTTCAGCATTATCAGAA -GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCC -ATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCA -GTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCA -GGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCA -GTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTAT -AGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTA -GACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG -ACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTG -GGACCAGCGGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGC -CATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATG -ATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAA -GAAGGGCACACAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGA -AAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATC -TGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCC -CCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCCCTCAGAAGCAGGAG -CCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGGTCACTCTTTGGCAACGACCCC -TCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATG -ATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAA -TTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATA -AAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGT -TGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGCCCTATTGAGACTGTACCAGTAA -AATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAA -TAAAAGCATTAGTAGAAATTTGTACAGAGATGGAAAAGGAAGGGAAAATTTCAAAAATTG -GGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAAT -GGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTC -AATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATG -TGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTA -CCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCAC -AGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTT -TTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGAT -CTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGA -GGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGG -GTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACA -GCTGGACTGTCAATGACATACAGAAGTTAGTGGGGAAATTGAATTGGGCAAGTCAGATTT -ACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAG -AAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAA -AAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGA -AGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAA -CAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGG -CAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAAC -TGCCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGA -TTCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGA -AAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTA -AATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCACCCTAACTG -ACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGAT -TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG -ATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGG -TCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAAT -TAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATG -AACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTG -TAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGC -ATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAA -AAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAG -CAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAA -AAACAATACATACTGACAATGGCAGCAATTTCACCGGTGCTACGGTTAGGGCCGCCTGTT -GGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAG -TAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAAC -ATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGA -TTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTA -AAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCA -GAAATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAA -TACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATT -ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACA -TGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTAT -AGACATCACTATGAAAGCCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGG -GATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCAT -TTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCT -GAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATA -AGAAAGGCCTTATTAGGACACATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAAC -AAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAG -CCACCTTTGCCTAGTGTTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACC -AAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGA -ATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATG -AAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGC -TGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGA -GAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAG -CCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGT -TTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGA -GCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTA -ATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATA -GTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGAC -AGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAA -ATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGAT -GATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAA -GGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACA -TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATT -GGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGA -GGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG -TGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAG -AATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAG -AGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAA -TGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCC -AAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCT -AAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACA -ATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGC -AGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGT -ACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAG -AATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATAT -GAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGC -TAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGG -AGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAA -TTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAA -TAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACAT -GTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTC -ATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGA -GATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATA -TAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGT -GCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGC -AGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTC -TGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTT -GCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATA -CCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCAC -TGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACAC -GACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAAT -TGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATG -GGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCAT -AATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAA -TAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGG -ACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAT -TCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTT -CAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGG -ACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGA -ACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGAC -AGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAG -AATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTA -GTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATA -GGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAG -CAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTC -CAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCC -ACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATA -TCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACAC -CAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTG -AGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGA -GCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCC -TAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATC -GAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGA -CTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG -TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTG -CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT -GACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA ->Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED -TGCTAGAGATTTTCCACACTGACTAAAAGGGTCTGAGGGATCTCTAGTTACCAGAGTCAC -ACAACAGACGGGCACACACTACTTGAAGCACTCAAGGCAAGCTTTATTGAGGCTTAAGCA -GTGGGTTCCCTAGTTAGCCAGAGAGCTCCCAGGCTCAGATCTGGTCTAACCAGAGAGACC -CAGTACAGGCAAAAAGCAGCTGCTTATATGCAGGATCTGAGGGCTCGCCACTCCCCAGTC -CCGCCCAGGCCACGCCTCCCTGGAAAGTCCCCAGCGGAAAGTCCCTTGTAGCAAGCTCGA -TGTCAGCAGTTCTTGAAGTACTCCGGATGCAGCTCTCGGGCCACGTGATGAAATGCTAGG -CGGCTGTCAAACCTCCACTCTAACACTTCTCTCTCCGGGTCATCCATCCCATGCAGGCTC -ACAGGGTGTAACAAGCTGGTGTTCTCTCCTTTATTGGCCTCTTCTATCTTATCTGGCTCA -ACTGGTACTAGCTTGTAGCACCATCCAAAGGTCAGTGGATATCTGACCCCTGGCCCTGGT -GTGTAGTTCTGCCAATCAGGGAAGTAGCCTTGTGTGTGGTAGATCCACAGATCAAGGATA -TCTTGTCTTCTTTGGGAGTGAATTAGCCCTTCCAGTCCCCCCTTTTCTTTTAAAAAGTGG -CTAAGATCTACAGCTGCCTTGTAAGTCATTGGTCTTAAAGGTACCTGAGGTGTGACTGGA -AAACCCACCTCCTCCTCCTCTTGTGCTTCTAGCCAGGCACAAGCAGCATTGGTAGCTGCT -GTATTGCTACTTGTGATTGCTCCATGTTTTTCCAGGTCTCGAGATGCTGCTCCCACCCTA -TCTGCTGCTGGCTCAGCTCGTCTCATTCTTTCCCTTACAGTAGGCCATCCAATCACACTA -CTTTTTGACCACTTGCCACCCATCTTATAGCAAAATCCTTTCCAAGCCCTGTCTTATTCT -TCTAGGTATGTGGCGAATAGCTCTACAAGCTCCTTGTACTACTTCTATAACCCTATCTGT -CCCCTCAGCTACTGCTATGGCTGTGGCATTGAGCAAGCTAACAGCACTATTCTTTAGTTC -CTGACTCCAATACTGTAGGAGATTCCACCAATATTTGAGGGCTTCCCACCCCCTGCGTCC -CAGAAGTTCCACAATCCTCGTTACAATCAAGAGTAAGTCTCTCAAGCGGTGGTAGCTGAA -GAGGCACAGGCTCCGCAGATCGTCCCAGATAAGTGCCAAGGATCCGTTCACTAATCGAAT -GGATCTGTCTCTGTCTCTCTCTCCACCTTCTTCTTCGGTTCCTTCGGGCCTGTCGGGTCC -CCTCGGGGTTGGGAGGTGGGTCTGAAACGATAATGGTGAATATCCCTGCCTAACTCTATT -CACTATAGAAAGTACAGCAAAAACTATTCTTAAACCTACCAAGCCTCCTACTATCATTAT -GAATAATTTTATATACCACAGCCAATTTGTTATGTTAAACCAATTCCACAAACTTGCCCA -TTTATCTAATTCCAATAATTCTTGTTCATTCTTTTCTTGCTGGTTTTGCGATTCTTCAAT -TAAGGAGTGTATTAAGCTTGTGTAATTGTTAATTTCTCTGTCCCACTCCATCCAGGTCGT -GTGATTCCAAATCTGTTCCAGAGATTTATTACTCCAACTAGCATTCCAAGGCACAGCAGT -GGTGCAAATGAGTTTTCCAGAGCAACCCCAAATCCCCAGGAGCTGTTGATCCTTTAGGTA -TCTTTCCACAGCCAGGATTCTTGCCTGGAGCTGCTTGATGCCCCAGACTGTGAGTTGCAA -CAGATGCTGTTGCGCCTCAATAGCCCTCAGCAAATTGTTCTGCTGCTGCACTATACCAGA -CAATAATTGTCTGGCCTGTACCGTCAGCGTCATTGAGGCTGCGCCCATAGTGCTTCCTGC -TGCTCCCAAGAACCCAAGGAACAAAGCTCCTATTCCCACTGCTCTTTTTTCTCTCTGCAC -CACTCTTCTCTTTGCCTTGGTGGGTGCTACTCCTAATGGTTCAATTTTTACTACTTTATA -TTTATATAATTCACTTCTCCAATTGTCCCTCATATCTCCTCCTCCAGGTCTGAAGATCTC -GGACTCATTGTTGCTATTACCACCATCTCTTGTTAATAGCAGCCCTGTAATATTTGATGA -ACATCTAATTTGTCCACTGATGGGAGGGGCATACATTGCTTTTCCTACTTTCTGCCACAT -GTTTATAATTTGTTTTATTCTGCATGGGAGGGTGATTGTGTCACTTCCTTCAGTGTTATT -TGACCCTTCAGTACTCCAAGTACTATTAAACCAAGTACTATTAAACAGTTGTGTTGAATT -ACAGTAGAAAAATTCCCCTCCACAATTAAAACTGTGCGTTACAATTTCTGGGTCCCCTCC -TGAGGATTGCTTAAAGATTATTGTTTTATTATTTCCAAATTGTTCTCTTAATTTGCTAGC -TATCTGTTTTAAAGTGTTATTCCATTTTGCTCTACTAATGTTACAATGTGCTTGTCTCAT -ATTTCCTATTTTTCCTATTGTAACAAATGCTCTCCCTGGTCCTCTCTGGATACGGATTCT -TTTTCTTGTATTGTTGTTGGGTCTTGTACAATTAATTTCTACAGATGTGTTCAGCTGTAC -TATTATGGTTTTAGCATTGTCCGTGAAATTGACAGATCTAATTACTACCTCTTCTTCTGC -TAGACTGCCATTTAACAGCAGTTGAGTTGATACTACTGGCCTAATTCCATGTGTACATTG -TACTGTGCTGACATTTGTACATGGTCCTGTTCCATTGAACGTCTTATTATTACATTTTAG -AATCGCAAAACCAGCCGGGGCACAATAATGTATGGGAATTGGCTCAAAGGATACCTTTGG -ACAGGCCTGTGTAATGACTGAGGTGTTACAACTTGTCAACTTATAGCTGGTAGTATCATT -ATCTATTGGTATTATATCAAGTTTATAAAAAAATGCATATTCTTTCTGCACCTTACCTCT -TATGCTTGTGCTGATATTGAAAGAGCAGTTTTTTATCTCTCCTTTCTCCATTATCATTCT -CCCGCTACTACTATTGGTATTAGTATCATTCTTCAAATCAGTGCACTTTAAACTAACACA -GAGTGGGGTTAATTTTACACATGGCTTTAGGCTTTGATCCCATAAACTGATTATATCCTC -ATGCATCTGTTCTACCATGTCATTTTTCCACATGTTAAAATTTTCTGTCACATTTACCAA -TACTACTTCTTGTGGGTTGGGGTCTGTGGGTACACAGGCATGTGTGGCCCAAACATTATG -TACCTCTGTATCATATGCTTTAGCATCTGATGCACAAAATAGAGTGGTGGTTGCTTCCTT -CCACACAGGTACCCCATAATAGACTGTGACCCACAATTTTTCTGTAGCACTACAGATCAT -CAACATCCCAAGGAGCATGGTGCCCCATCTCCACCCCCATCTCCACAAGTGCTGATATTT -CTCCTTCACTCTCATTGCCACTGTCTTCTGCTCTTTCTATTAGTCTATCAATTAACCTGT -CTATTTTTCTTTGTCTTAATATTTTCCTATATTCTATGATTACTATGGACCACACAACTA -TTGCTATTATTATTGCTACTACTAATGCTACTATTGCTACTATTGGTATAGGTTGCATTA -CATGTACTACTTACTGCTTTGATAGAGAAGCTTGATGAGTCTGACTGTTCTGATGAGCTC -TTCGTCGCTGTCTCCGCTTCTTCCTGCCATAGGAGATGCCTAAGGCTTTTGTTATGAAAC -AAACTTGGCAATGAAAGCAACACTTTTTACAATAGCAATTGGTACAAGCAGTTTTAGGCT -GACTTCCTGGATGCTTCCAGGGCTCTAGTCTAGGATCTACTGGCTCCATTTCTTGCTCTC -CTCTGTCGAGTAACGCCTATTCTGCTATGTCGACACCCAATTCTGAAATGGATAAACAGC -AGTTGTTGCAGAATTCTTATTATGGCTTCCACTCCTGCCCAAGTATCCCCATAAGTTTCA -TAGATATGTTGCCCTAAGCCATGGAGCCAAATCCTAGGAAAATGTCTAACAGCTTCATTC -TTAAGCTCCTCTAAAAGCTCTAGTGTCCATTCATTGTGTGGCTCCCTCTGTGGCCCTTGG -TCTTCTGGGGCTTGTTCCATCTATCCTCTGTCAGTTTCGTAACACTAGGCAAAGGTGGCT -TTATCTTTTTTGGTGTTATTAATGCTGCTAGTGCCAAGTATTGTAGAGATCCTACCTTGT -TATGTCCTGCTTGATATTCACACCTAGGGCTAACTATGTGTCCTAATAAGGCCTTTCTTA -TAGCAGAGTCTGAAAAACAGTCAAAGTAATACAGATGAATTAGTTGGTCTGCTAGTTCAG -GGTCTACTTGTGTGCTATATCTCTTTTTCCTCCATTCTATGGAGACTCCCTGACCCAAAT -GCCAGTCTCTTTCTCCTGTATGCAGACCCCAATATGTTGTTATTACCAATCTAGCATCCC -CTAGTGGGATGTGTACTTCTGAACTTATTCTTGGATGAGGGCTTTCATAGTGATGTCTAT -AAAACCATCCCCTAGCTTTCCCTGAAACATACATATGGTGTTTTACTAAACTTTTCCATG -TTCTAATCCTCATCCTGTCTACTTGCCACACAATCATCACCTGCCATCTGTTTTCCATAA -TCCCTAATGATCTTTGCTTTTCTTCTTGGCACTACTTTTATGTCACTATTATCTTGTATT -ACTACTGCCCCTTCACCTTTCCAGAGGAGCTTTGCTGGTCCTTTCCAAAGTGGATTTCTG -CTGTCCCTGTAATAAACCCGAAAATTTTGAATTTTTGTAATTTGTTTTTGTAATTCTTTA -GTTTGTATGTCTGTTGCTATTATGTCTACTATTCTTTCCCCTGCACTGTACCCCCCAATC -CCCCCTTTTCTTTTAAAATTGTGGATGAATACTGCCATTTGTACTGCTGTCTTAAGATGT -TCAGCCTGATCTCTTACCTGTCCTATAATTTTCTTTAATTCTTTATTCATAGATTCTACT -ACTCCTTGACTTTGGGGATTGTAGGGAATTCCAAATTCCTGCTTGATTCCCGCCCACCAA -CAGGCGGCCCTAACCGTAGCACCGGTGAAATTGCTGCCATTGTCAGTATGTATTGTTTTT -ACTGGCCATCTTCCTGCTAATTTTAAAAGAAAATATGCTGTTTCCTGCCCTGTTTCTGCT -GGAATAACTTCTGCTTCTATATATCCACTGGCTACATGAACTGCTACCAGGATAACTTTT -CCTTCTAAATGTGTACAATCTAGTTGCCATATTCCTGGACTACAGTCTACTTGTCCATGC -ATGGCTTCTCCTTTTAGCTGACATTTATCACAGCTGGCTACTATTTCTTTTGCTACTACA -GGTGGCAGGTTAAAATCACTAGCCATTGCTCTCCAATTACTGTGATATTTCTCATGTTCA -TCTTGGGCCTTATCTATTCCATCTAAAAATAGTACTTTCCTGATTCCAGCACTGACTAAT -TTATCTACTTGTTCATTTCCTCCAATTCCTTTGTGTGCTGGTACCCATGCCAGATAGACC -TTTTCCTTTTTTATTAACTGCTCTATTATTTGATTGACTAACTCTGATTCACTTTGATCT -GGTTGTGCTTGAATGATTCCTAATGCATATTGTGAGTCTGTTACTATGTTTACTTCTAAT -CCCGAATCCTGCAAAGCTAGATAAATTGCTTGTAACTCAGTCTTCTGATTTGTTGTGTCA -GTTAGGGTGACAACTTTTTGTCTTCCTCTATTAGTAACATATCCTGCTTTTCCTAATTTA -GTCTCCCTGTTAGCTGCCCCATCTACATAGAAGGTTTCTGCTCCTACTATGGGTTCTTTC -TCTAACTGGTACCATAATTTCACTAAGGGAGGGGTATTAACAAACTCCCACTCAGGAATC -CAGGTGGCTTGCCAATACTCTGTCCACCATGTTTCCCATGTTTCCTTTTGTATGGGCAGT -TTAAATTTAGGAGTCTTTCCCCATATTACTATGCTTTCTGTGGTTATTTTTTGCACTGCC -TCTGTTAATTGTTTTACATCATTAGTGTGGGCACCCCTCATTCTTGCATATTTTCCTGTT -TTCAGATTTTTAAATGGCTCTTGATAAATTTGATATGTCCATTGGCCTTGCCCCTGCTTC -TGTATTTCTGCTATTAAGTCTTTTGATGGGTCATAATACACTCCATGTACTGGTTCTTTT -AGAATCTCTCTGTTTTCTGCCAGTTCTAGCTCTGCTTCTTCTGTTAGTGGTATTACTTCT -GTTAGTGCTTTGGTTCCTCTAAGGAGTTTACATAATTGCCTTACTTTAATCCCTGGGTAA -ATCTGACTTGCCCAATTCAATTTCCCCACTAACTTCTGTATGTCATTGACAGTCCAGCTG -TCTTTTTCTGGCAGCACTATAGGCTGTACTGTCCATTTATCAGGATGGAGTTCATAACCC -ATCCAAAGGAATGGAGGTTCTTTCTGATGTTTTTTGTCTGGTGTGGTAAGTCCCCACCTC -AACAGATGTTGTCTCAGCTCCTCTATTTTTGTTCTATGCTGCCCTATTTCTAAGTCAGAT -CCTACATACAAATCATCCATGTATTGATAGATAACTATGTCTGGATTTTGTTTTCTAAAA -GGCTCTAAGATTTTTGTCATGCTACTTTGGAATATTGCTGGTGATCCTTTCCATCCCTGT -GGAAGCACATTGTACTGATATCTAATCCCTGGTGTCTCATTGTTTATACTAGGTATGGTA -AATGCAGTATACTTCCTGAAGTCTTCATCTAAGGGAACTGAAAAATATGCATCACCCACA -TCCAGTACTGTTACTGATTTTTTCTTTTTTAACCCTGCGGGATGTGGTATTCCTAATTGA -ACTTCCCAGAAGTCTTGAGTTCTCTTATTAAGTTCTCTGAAATCTACTAATTTTCTCCAT -TTAGTACTGTCTTTTTTCTTTATGGCAAATACTGGAGTATTGTATGGATTTTCAGGCCCA -ATTTTTGAAATTTTCCCTTCCTTTTCCATCTCTGTACAAATTTCTACTAATGCTTTTATT -TTTTCTTCTGTCAATGGCCATTGTTTAACTTTTGGGCCATCCATTCCTGGCTTTAATTTT -ACTGGTACAGTCTCAATAGGGCTAATGGGAAAATTTAAAGTGCAACCAATCTGAGTCAAC -AGATTTCTTCCAATTATGTTGACAGGTGTAGGTCCTACTAATACTGTACCTATAGCTTTA -TGTCCACAGATTTCTATGAGTATCTGATCATACTGTCTTACTTTGATAAAACCTCCAATT -CCCCCTATCATTTTTGGTTTCCATCTTCCTGGCAAACTCATTTCTTCTAATACTGTATCA -TCTGCTCCTGTATCTAATAGAGCTTCCTTTAGTTGCCCCCCTATCTTTATTGTGACGAGG -GGTCGTTGCCAAAGAGTGACCTGAGGGAAGTTAAAGGATACAGTTCCTTGTCTATCGGCT -CCTGCTTCTGAGGGGGAGTTGTTGTCTCTACCCCAGACCTGAAGCTCTCTTCTGGTGGGG -CTGTTGGCTCTGGTCTGCTCTGAAGAAAATTCCCTGGCCTTCCCTTGTAGGAAGGCCAGA -TCTTCCCTAAAAAATTAGCCTGTCTCTCAGTACAATCTTTCATTTGGTGTCCTTCCTTTC -CACATTTCCAACAGCCCTTTTTCCTAGGGGCCCTGCAATTTCTGGCTGTGTGCCCTTCTT -TGCCACAATTGAAACACTTAACAATCTTTCTTTGGTTCCTAAAATTGCCTCTCTGCATCA -TTATGGTAGCTGAATTTGTTACTTGGCTCATTGCTTCAGCCAAAACTCTTGCCTTATGGC -CGGGTCCTCCTACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCCGCTGGTCCCA -ATGCTTTTAAAATAGTCTTACAATCTGGGTTCGCATTTTGGACCAACAAGGTTTCTGTCA -TCCAATTTTTTACCTCCTGTGAAGCTTGCTCGGCTCTTAGAGTTTTATAGAACCGGTCTA -CATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTCTTATGTCCAGAATGCTGGTAGGGCTAT -ACATTCTTACTATTTTATTTAATCCCAGGATTATCCATCTTTTATAAATTTCTCCTACTG -GGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTG -CTATGTCACTTCCCCTTGGTTCTCTCATCTGGCCTGGTGCAATAGGCCCTGCATGCACTG -GATGCACTCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAACATTTGCATGG -CTGCTTGATGTCCCCCCACTGTGTTTAGCATGGTGTTTAAATCTTGTGGGGTGGCTCCTT -CTGATAATGCTGAAAACATGGGTATCACTTCTGGGCTGAAAGCCTTCTCTTCTACTACTT -TTACCCATGCATTTAAAGTTCTAGGTGATATGGCCTGATGTACCATTTGCCCCTGGATGT -TCTGCACTATAGGGTAATTTTGGCTGACCTGATTGCTGTGTCCTGTGTCAGCTGCTGCTT -GCTGTGCTTTTTTCTTACTTTTGTTTTGCTCTTCCTCTATCTTGTCTAAAGCTTCCTTGG -TGTCTTTTATCTCTATCCTTTGATGCACACAATAGAGGGTTGCTACTGTATTATATAATG -ATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTCCCAGTATTTGTCTAC -AGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTG -CCCATACTATATGTTTTAATTTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTTT -CCCATCGATCTAATTCTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTC -TAGCCTCCGCTAGTCAAAATTTTTGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCC -GTGCGCGCTTCAGCAAGCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCCCTTTCGCT -TTCAGGTCCCTGTTCGGGCGCCACTGCTAGAGATTTTCCACACTGACTAAAAGGGTCTGA -GGGATCTCTAGTTACCAGAGTCACACAACAGACGGGCACACACTACTTGAAGCACTCAAG -GCAAGCTTTATTGAGGCTTAAGCAGTGGGTTCCCTAGTTAGCCAGAGAGCTCCCAGGCTC -AGATCTGGTCTAACCAGAGAGACCCAGTACAGGCAAAAAGCAGCTGCTTATATGCAGGAT -CTGAGGGCTCGCCACTCCCCAGTCCCGCCCAGGCCACGCCTCCCTGGAAAGTCCCCAGCG -GAAAGTCCCTTGTAGCAAGCTCGATGTCAGCAGTTCTTGAAGTACTCCGGATGCAGCTCT -CGGGCCATGTGATGAAATGCTAGGCGGCTGTCAAACCTCCACTCTAACACTTCTCTCTCC -GGGTCATCCATTCCATGCAGGCTCACAGGGTGTAACAAGCTGGTGTTCTCTCCTTTGTTG -GCTTCTTCTAACTTCTCTGGCTCAACTGGTACTAGCTTGTAGCACCATCCAAAGGTCAGT -GGATATCTGATCCCTGGCCCTGGTGTGTAGTTCTGCTAATCAGGGAAGTAGCCTTGTGTG -TGGTAGATCCACAGATCAAGGATATCTTGTCTTCGTTGGGAGTGAATTAGCCCTTCCA diff --git a/tests/expected-results-edgy/orfs.json b/tests/expected-results-edgy/orfs.json index 3719cdd..b12e9ab 100644 --- a/tests/expected-results-edgy/orfs.json +++ b/tests/expected-results-edgy/orfs.json @@ -41,9 +41,9 @@ "start": 5558, "end": 5849, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5293125263601849, + "distance": 0.0, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -52,8 +52,8 @@ "name": "tat_exon1", "start": 5829, "end": 6048, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.0, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", @@ -64,46 +64,46 @@ "name": "rev_exon1", "start": 5968, "end": 6049, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.17292490118577064, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", "aminoacids": "MAGRSGDSDEELIRTVRLIKLLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6060, + "end": 6309, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.0, + "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", + "aminoacids": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL*", + "nucleotides": "ATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6223, "end": 8794, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.005620924829498719, + "distance": 0.0, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL*", "nucleotides": "ATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAGAATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAATGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGAATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACACGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA" }, - { - "name": "vpu", - "start": 6258, - "end": 6309, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.0, - "protein": "MGVEMGHHAPWDVDDL", - "aminoacids": "MGVEMGHHAPWDVDDL*", - "nucleotides": "ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8375, "end": 8471, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.13888888888888895, + "distance": 0.0, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", "aminoacids": "RPTSQPRGDPTGPKEPKKKVERETETDPFD**", "nucleotides": "AGACCCACCTCCCAACCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA" @@ -112,8 +112,8 @@ "name": "rev_exon2", "start": 8376, "end": 8652, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.0, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -124,10 +124,10 @@ "name": "nef", "start": 8795, "end": 9416, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.02294981640146876, + "distance": 0.0, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATAGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA" @@ -175,9 +175,9 @@ "start": 5558, "end": 5849, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5293125263601849, + "distance": 0.0, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -186,8 +186,8 @@ "name": "tat_exon1", "start": 5829, "end": 6048, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.0, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", @@ -198,46 +198,46 @@ "name": "rev_exon1", "start": 5968, "end": 6049, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.17292490118577064, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", "aminoacids": "MAGRSGDSDEELIRTVRLIKLLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6060, + "end": 6309, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.0, + "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", + "aminoacids": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL*", + "nucleotides": "ATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6223, "end": 8794, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.005620924829498719, + "distance": 0.0, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL*", "nucleotides": "ATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAGAATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAATGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGAATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACACGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA" }, - { - "name": "vpu", - "start": 6258, - "end": 6309, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.0, - "protein": "MGVEMGHHAPWDVDDL", - "aminoacids": "MGVEMGHHAPWDVDDL*", - "nucleotides": "ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8375, "end": 8471, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.13888888888888895, + "distance": 0.0, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", "aminoacids": "RPTSQPRGDPTGPKEPKKKVERETETDPFD**", "nucleotides": "AGACCCACCTCCCAACCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA" @@ -246,8 +246,8 @@ "name": "rev_exon2", "start": 8376, "end": 8652, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.0, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -258,10 +258,10 @@ "name": "nef", "start": 8795, "end": 9416, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.02294981640146876, + "distance": 0.0, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATAGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA" diff --git a/tests/expected-results-large-csv/blast.csv b/tests/expected-results-large-csv/blast.csv index 95436d9..2c4fc32 100644 --- a/tests/expected-results-large-csv/blast.csv +++ b/tests/expected-results-large-csv/blast.csv @@ -1,117 +1,118 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,9386,9635,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,180,1,180,9540,9719,2.04e-69,259,100.000,180,plus,180 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,9497,1,9493,151,9632,0.0,13151,98.473,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG229-T41AG5AG81CA45GA54CG3CA3AGGA18TC32TC11AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA85AG143AG14GA38TC52AG146GA285GA25AG11TC47GA58AG11TG181GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,484,1,484,9236,9719,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,634,1,634,9086,9719,0.0,813,94.795,601,plus,14TCGAGC5GA1AG56GA21GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,9488,9579,2.15e-30,131,98.913,91,plus,18GC73 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,8446,666,9069,1323,9673,0.0,9611,90.161,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC2-T17AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG9TC4TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC46GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC13GA3AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,8140,882,8985,1584,9666,0.0,9469,91.032,7410,plus,6TC32TC59TC77GA5AG17CT17TA5AG29CT8GA32GT23CT6TA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT7GA11CT4CT3AG6AC4AG17GA11TG1TC5ATGAAG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA17AG41CT13AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG57AG7TC32GA11TC56CT69CT45CT39AG95AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA2GA9GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG10GA2TC23TC2AG2AG2AT4CT18CT3GA1CT18AG2TA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG11GA5AG35CT6AC1AG30TA71TC26AG61GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29CA18CG7AGCA22GT99AG92GA13GA14TC23GA32AG17AG2TC34GA31CA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14AT35AG25GA27CA29TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2AT21GT1GC24ACGA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACT6TC6CT4AG23AG23TCCA23GC7TC2-T12AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG33GA20GA10GAGA5GT2CT4GA23AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC2CT1GA2ACCT7TC4TC27TC4TC2TA2GCAC4TG26TA1TA14CT2TG5TC6CA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-4TG5CG20CTAG4CT5AG2-C-T-A4GAGA1CA1CT36AG6GA28CT11CT11CT5CT14TC34AT2-T-G-G7AG14TCGACTAG9AG10TA76CG6CG6AG1CTAT1CG2TG1GACT-G-A-T7TCAC2CT1AG2CGCT1-G-C-G-G-G-A-G-A-A-T-G3GA1AGTG5-G4AG2GA1CA12TC3GA3CG4GATG8AG9AG3CG8CT17GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-C-T-A-T-A-G-5TC2AG7TA5AGCT81GA5GTGA6ACTG16TC5AC6TC51TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC10GA3TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG39GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT10AT4TG2AG1-G-A-C1TCTA5AC10AGGA4GAGA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG69CA36GA46CT46AC5AG14AG8TA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGTAT4TC2ATAC10CG46GA30GA10GT18AT4TC20AGAG20AG37CT22TA7GA2GC28CA1GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG9TC7AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7TG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA16GA25AG1AC28TA13AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT3TC1AG16TA5AG21CT1GA16AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,846,40,881,1539,694,0.0,1076,94.563,800,minus,15CT14GA2GA23CT26CA22AC30AG2TC17AG38CT29GT17TC11AG23CT53CG35GA5AG1TG5GT20TCCT20TC69AGCT13AT8TC7CT17TG1CA75CT2TC29CT6CT31CT6TCTGGA23CT47AT-T-T-T-T12GATG21TC25 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,582,8404,8985,1,581,0.0,693,91.753,534,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA13AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT3TC1AG16TA5AG21CT1GA4GA11AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 -MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9719,9070,477,9480,577,9627,0.0,10903,92.381,8379,plus,25AG1-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T1AGTA23C-5TG2T-A-GCAT11TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9719,544,8946,9480,1,542,1.17e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9084,652,9689,652,9670,0.0,10957,92.459,8399,plus,15AG51AG25-T-G-A-G-T-A-C-G-C-C-A-A2TA71CTACAGGA17GA25GA6GA5CA38CT39AC17GT34GA29AG15GA25GC3GA51GA1GA5AC6GA4A-C-C-A-G-C-AGCT21AG8TC89AG11CT6CT119TG10AG35GA62TA83CT11AG23GA20TC71AG47TA5AG11GA26GA11TC5AG11AG2GT16CT13GA40AG1GT12TC5CT8TA7TC3AC1AG18AG1GA49CA1AT26AG12CT7GA22AG27GA13TC5ATGA15TC14ACAC7CA4CA12GA9AGAG35GA61CA77AG122TC8AG95CT5AG29AT8GA68CT11AT101CA20CTAG59GA82AG4AT16AG10AC36CT21TC9AG2AG19AG7TC52GT17CT2GA19CT15AC35AG8CT14CT8AG26AC5GA3GA32AG17TC1AG11GA76AG9GA95GA21GA16GA25GA3AG11AG12GA13AG38CT17AG47TC29AG7CT43AG2CA37TA20AG20TC17GA33AC21GA123GA29AT2CA59GA170CT11GA12GA7CT3AC17CA11GACA12AT21AG7AG4AG9CT8AG2GA17CA44CT2TA5GA71TC60GA14TA14CT26CA29GA73AC32TC68GC4CA1CA20AG3AG16AG6GT6AG14AG1AC20AG5TC16AT6CT3CT1GA43CT36GAAG22AG1CA35TC11AC14TG1TC1AT10TC1GT49TC4GA12AG8GA15CT19AG39GAAG12CA6AG3TC11GA27GA27GT23CT8GA18AG14TA9GT18CT2TC2-T33ACAG6CG10AG25AGTA26CT8GA13CA13CA9AT24CA4GC36AG6GA2TG3CA3AGGA9TC41TC4TC2TA2GC5TG26GACTCA21AT8TA31GA24AC3GT15TC20G-G-A-T-C-A-T-G-A-4TA11AG-T-G-G-A-G-A-T-G-G-G-G-G13TC51TC29AG7AC12CT34CT33TC21AG3GT5AT34AG87CG4CA1TG6AG1GT3GA3TA1AG3G-C-A-4GT1A-G-A-1TC5C-A-C-2AG2AGTC2TG1CGTA1ATCG2C-4C-C-A-C-T-2T-2TA1G-T-T-G-G-2GA2AG2GA19CT2CGTCGA12AG6AG4GA5TA3GACT20GA17GAAC2TC2AG5GA3AG1TC19CA79GA4GAATGA4AG1ACTG16AC5AC15GA47CA34AG5ATAC3AT4AG6AG7TC17TCGA9CA4GATA33TA2AC1CG3-C-C-A-G-A-G3GA11GA3TGAT1GA2GACT4GA1T-A-T-7GA1CT2AG4GA6CT4TA1CA3AGCT1AG1AG3CA4GA7ATAT2GA5GA6AGAC19-G-A-A1GT5GA6GA6GATGGC7GA18AGCT2TC1ACTATC39GATC22CTAT5AG1GAGCGTAT1TG6AGCA8GA2GA2GC6CA1AG1-G-A-C-A-C-A5AC10AG28GA34AT4CA6CA2CTGTACGA15TC5CT16GT3GAAG1G-C-T-3G-G-G-2CTAG1CGAT6CT19AG17CA15GA3CT40GA4CA13AG23TACA1CA5CT47GC5AG87AC28AG15GA44CA25CT4AC19AG13CT11TAGC1TG6CA2AC3TC18AC9GA12AG1AT5TC2ATGC9GA1CA8CA28CT1AG8CT12CT15GA4TA4CT11CT6AT47AG2AG26AC7CT30GA3AC26CTCA1GA3CA12CAAG17CT2AGCA6GA1TC4TC3AG3AC9TA3CT7AG13CATG32CT1GA49CT8CT2TC2GA11GT1GA30TC38AG10GT1TG1GA1GACAAG6TG10ACTG36AGGACT5AT4AG8TC2AG9TA5AG1AGGA28AG8AT14ATGA12TC18GA24-A-C-A-G-C-A4AC8AC4AG7GA5CA1A-A-A-4AG11AG2CT10GCGA11CT26CTTG44AC5TC9AG12TC12GA5AC24GA25AGCTTC4TA23TA24GT1GA1GA9ACGC6AG8CAGC1TA14AG6AT18AG4AG7CT2CG25CA5CT5AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 -MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,602,9088,9689,1,585,0.0,679,89.701,540,plus,8AC5TC8ACAG12TC12GA5AC24GA26CTTC4TA23TA26GA1GT7GA1ACGC2TC3AG8CAGC1TA14AG6AT6GA11AG4AG7CT2CG25CA5CT3GA1AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 -MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9719,9061,410,9377,577,9625,0.0,10733,91.855,8323,plus,25-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G3-G-G-A28AGCATC1GT1GA1CATG1-G-A-A-ATG2TA3TC1-G-A-G3AC2CT3-G1TC1TC1-G-G1AC2-GTG2AT2-T-G1GATGGC4CA2-G-C2CG3-CAGCACGTG1AGACAG4-C-T-G-G-TAG4-C-G-C-C3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC13GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9719,542,8845,9377,1,540,2.31e-175,613,90.037,488,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9719,9072,369,9381,577,9624,0.0,10860,92.262,8370,plus,25A-C-TG1ACACTCCT1CT3-T4G-1CT1C-C-C-2A-C-T-28A-G-3T-4TA8TGAG20GA29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 -MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9719,541,8850,9381,1,539,8.58e-176,615,90.203,488,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,9152,512,9583,577,9686,0.0,10851,91.882,8409,plus,24-A-G-A-C-C2-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27-G-G2T-3GATA1AG1TG1GA2A-T-C-C-C-T-C-T-2TA3TC4A-TGCACG3AT1CT1CG1A-A-T-29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,668,8973,9614,1,649,0.0,688,86.976,581,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,79,273,351,577,649,8.05e-10,64.0,78.481,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-CTCGCGTA27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,81,405,485,577,649,5.83e-09,61.1,76.543,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-C-A-CTCGCGCA27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,31,273,303,9662,9692,8.42e-04,44.0,96.774,30,plus,28TC2 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,31,405,435,9662,9692,8.42e-04,44.0,96.774,30,plus,28TC2 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,9112,34,9126,646,9679,0.0,10568,90.935,8286,plus,21AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC12AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG38AG7AG20AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA27AT30AG4TC50GA57TC9CT7GA17CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTAG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA7AC11CTCT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3T-1TC2-A2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2-A1GA1CACT1GTGC2GC1AC2AG1C-AG1CAAG2-G-G-GTG14TC1TA2TC11GT7AC8-T-A3-A3CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-T-2AG2T-C-T-AG3CGGACTCA4CT1ACTC4C-T-T-6AGTCAGAGTG1C-TG3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11G-A-A-G-G-T-1GA2G-A-A-7G-G-G-2AGAC4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10-A-A-A3-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT5AG8A-T-G-7TAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12A-A-G-C-A-A-CT5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG5CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC8A-C-C-C-T-A-G-A-T-1GT4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT8AG20CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC27AG3AC1GTTG6CG2GA9C-A-G-8AG19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,598,8529,9126,1,594,0.0,670,89.632,536,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,33,1,33,702,670,1.52e-05,49.7,100.000,33,minus,33 -MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9719,9071,458,9461,577,9625,0.0,10898,92.382,8380,plus,25-G-A3-T-T-T3-T-C-A-G-T-G-T-G-G-A-A-A20C-G-1A-G-G-C-2TAAG17TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9719,542,8929,9461,1,540,8.47e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,9036,130,9032,649,9627,0.0,10320,90.317,8161,plus,18AG72-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-A-A-A47GA23CTACAG6GA31GA6GA29AG2GA75GT19GA7AG8TA13GATC20AG48AG20GAAG28TC1AG2GACT35GC53GA20AT2TC11AG17CA29GA38TC17AG2TC30TG22GT23GA2GA23CT2CT14GA47CT2CT47TC59TC77GA5AG14AG2CT17TA5AG29CT8GA32GT23CT3AGAC1GA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT19CT4CT3AG5GAAC4AG17GA11TG1TC5AT1AG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA8CA4AG3AG55AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG25GA31AG7AC32GA11TC56CT69CT5AG13AG25CT39AG83TA11AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA12GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG13TC23TC2AG2AG2AT4CT18CT3GA1CT18AG1TCTA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG8AT2TA5AG35CT8AG9AG52TC39TC26AG25TC35GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29TA18CG7AGCA10GA11GT99AG92GA13GA14TC23GA32AG13TC3AG2TC34GA30AGCA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14CT35AG25GA57TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2GT21GT1GC25GA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACTAT5TC2CT3CT4AG23AG23TCCA9CT13GC7TC2-T12AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG2GA30GA20GA11GA8CT4GA14GA8AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC1AGCT4ACCT7TC4TC7AG4GA14TC4TC2TA2GCAC4TG26TA1TA14CT2TG5TC6TA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-3GA6CG17GT2CTAG4CT5AG2-C-T-A5GA1CA1CT36AG35CT11CTCA10CT5CT14TC34AT2-T-G-G22TCGACTAG9AG10TA76CG6CG8GT9AGGACT4CA2TCAC2CT1AG2CGCT2TC-G-G-G2TA2-G1GT2-T-G-G-A1-A7AG2GA8TC5TC3GACT2CG4GACGAC7AG9AG3CG8CT9GA7GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-A-T-A-T-A-G-5TC2AG7TA2GT2AGCT51-T-T-G-T-G-C-C-C-C-G-G-C-T1-G-T-T-T-T-G-C-G-A-T-T-C-T-A-A-A-A-T-G-T-A-A-T-A-A-T-A-A-G-A-C-G-T-T-C-A-A-T-G-G-A-A-C-A-G-G-A-C-C-A-T-G-T-A-C-A-A-A-T-G-T-C-A-G-C-A-C-A45TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC14TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG3AC35GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT7TC2AT4TG2AG1-G-A-C1TCTA5AC10AGGA5GA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG29AG39CA36GA46CT46AC5AG14AG8CA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGT5TC2ATAC10CG46GA22CA7GA10GT18AT4TC20AGAG20AG60TA7GA2GC28CA1GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG17AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7CG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA16GA25AG1AC28TA9GA3AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT5AG2TG1AG11TA5AG21CT1GA16AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,543,8492,9032,1,542,4.15e-180,629,90.792,493,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA9GA3AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT5AG2TG1AG11TA5AG21CT1GA4GA11AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,150,1,129,782,633,2.35e-34,145,84.667,127,minus,23-T-T-T-T-T-G-G-C-G-T-A-C-T-C-A-C-C-A-G-T72TC12AG16-C4 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,9385,9634,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,180,1,180,9539,9718,2.04e-69,259,100.000,180,plus,180 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,9496,1,9493,151,9631,0.0,13155,98.484,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG270AG5AG81CA45GA54CG3CA3AGGA18TC44AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA24TCAC59AG143AG14GA38TC52AG146GA311AG11TC47GA58AG11TG181GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,484,1,484,9235,9718,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,634,1,634,9085,9718,0.0,816,94.953,602,plus,14TCGAGC5GA1AG78GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,9487,9578,2.15e-30,131,98.913,91,plus,18GC73 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,8445,666,9069,1323,9672,0.0,9616,90.172,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC19AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG14TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC16TCAC28GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC17AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,8139,882,8985,1584,9665,0.0,9479,91.068,7412,plus,6TC32TC59TC77GA5AG17CT17TA5AG29CT8GA32GT23CT6TA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT7GA11CT4CT3AG6AC4AG17GA11TG1TC5ATGAAG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA17AG41CT13AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG57AG7TC32GA11TC56CT69CT45CT39AG95AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA2GA9GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG10GA2TC23TC2AG2AG2AT4CT18CT3GA1CT18AG2TA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG11GA5AG35CT6AC1AG30TA71TC26AG61GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29CA18CG7AGCA22GT99AG92GA13GA14TC23GA32AG17AG2TC34GA31CA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14AT35AG25GA27CA29TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2AT21GT1GC24ACGA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACT6TC6CT4AG23AG23TCCA23GC7TC14AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG33GA20GA10GAGA5GT2CT4GA23AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC2CT1GA2ACCT7TC4TC32TC2TA2GCAC4TG26TA1TA14CT2TG5TC6CA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-4TG5CG20CTAG4CT5AG2-C-T-A4GAGA1CA1CT36AG6GA28CT11CT11CT5CT14TC34AT2-T-G-G7AG14TCGACTAG9AG10TA76CG6CG6AG1CTAT1CG2TG1GACT-G-A-T7TCAC2CT1AG2CGCT1-G-C-G-G-G-A-G-A-A-T-G3GA1AGTG5-G4AG2GA1CA12TC3GA3CG4GATG8AG9AG3CG8CT17GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-C-T-A-T-A-G-5TC2AG7TA5AGCT81GA5GTGA6ACTG16TC5AC6TC51TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC10GA3TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG39GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT10AT4TG2AG1-G-A-C1TCTA5AC10AGGA4GAGA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG69CA36GA46CT46AC5AG14AG8TA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGTAT4TC2ATAC10CG46GA30GA10GT18AT4TC20AGAG20AG37CT22TA7GA2GC27TC2GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG9TC7AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7TG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA42AG1AC28TA13AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT3TC1AG16TA5AG21CT1GA16AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,846,40,881,1539,694,0.0,1076,94.563,800,minus,15CT14GA2GA23CT26CA22AC30AG2TC17AG38CT29GT17TC11AG23CT53CG35GA5AG1TG5GT20TCCT20TC69AGCT13AT8TC7CT17TG1CA75CT2TC29CT6CT31CT6TCTGGA23CT47AT-T-T-T-T12GATG21TC25 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,582,8404,8985,1,581,0.0,693,91.753,534,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA13AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT3TC1AG16TA5AG21CT1GA4GA11AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 +MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9718,9069,477,9480,577,9626,0.0,10913,92.414,8381,plus,25AG1-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T1AGTA23C-5TG2T-A-GCAT11TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9718,544,8946,9480,1,542,1.17e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9083,652,9689,652,9669,0.0,10973,92.513,8403,plus,15AG51AG25-T-G-A-G-T-A-C-G-C-C-A-A2TA71CTACAGGA17GA25GA6GA5CA38CT39AC17GT34GA29AG15GA25GC3GA51GA1GA5AC6GA4A-C-C-A-G-C-AGCT21AG8TC89AG11CT6CT119TG10AG35GA62TA83CT11AG23GA20TC71AG47TA5AG11GA26GA11TC5AG11AG2GT16CT13GA40AG1GT12TC5CT8TA7TC3AC1AG18AG1GA49CA1AT26AG12CT7GA22AG27GA13TC5ATGA15TC14ACAC7CA4CA12GA9AGAG35GA61CA77AG122TC8AG95CT5AG29AT8GA68CT11AT101CA20CTAG59GA82AG4AT16AG10AC36CT21TC9AG2AG19AG7TC52GT17CT2GA19CT15AC35AG8CT14CT8AG26AC5GA3GA32AG17TC1AG11GA76AG9GA95GA21GA16GA25GA3AG11AG12GA13AG38CT17AG47TC29AG7CT43AG2CA37TA20AG20TC17GA33AC21GA123GA29AT2CA59GA170CT11GA12GA7CT3AC17CA11GACA12AT21AG7AG4AG9CT8AG2GA17CA44CT2TA5GA71TC60GA14TA14CT26CA29GA73AC32TC68GC4CA1CA20AG3AG16AG6GT6AG14AG1AC20AG5TC16AT6CT3CT1GA43CT36GAAG22AG1CA35TC11AC14TG1TC1AT10TC1GT49TC4GA12AG8GA15CT19AG39GAAG12CA6AG3TC11GA27GA27GT23CT8GA18AG14TA9GT18CT2TC35ACAG6CG10AG25AGTA26CT8GA13CA13CA9AT24CA4GC36AG6GA2TG3CA3AGGA9TC46TC2TA2GC5TG26GACTCA21AT8TA31GA24AC3GT15TC20G-G-A-T-C-A-T-G-A-4TA11AG-T-G-G-A-G-A-T-G-G-G-G-G13TC51TC29AG7AC12CT34CT33TC21AG3GT5AT34AG87CG4CA1TG6AG1GT3GA3TA1AG3G-C-A-4GT1A-G-A-1TC5C-A-C-2AG2AGTC2TG1CGTA1ATCG2C-4C-C-A-C-T-2T-2TA1G-T-T-G-G-2GA2AG2GA19CT2CGTCGA12AG6AG4GA5TA3GACT20GA17GAAC2TC2AG5GA3AG1TC19CA79GA4GAATGA4AG1ACTG16AC5AC15GA47CA34AG5ATAC3AT4AG6AG7TC17TCGA9CA4GATA33TA2AC1CG3-C-C-A-G-A-G3GA11GA3TGAT1GA2GACT4GA1T-A-T-7GA1CT2AG4GA6CT4TA1CA3AGCT1AG1AG3CA4GA7ATAT2GA5GA6AGAC19-G-A-A1GT5GA6GA6GATGGC7GA18AGCT2TC1ACTATC39GATC22CTAT5AG1GAGCGTAT1TG6AGCA8GA2GA2GC6CA1AG1-G-A-C-A-C-A5AC10AG28GA34AT4CA6CA2CTGTACGA15TC5CT16GT3GAAG1G-C-T-3G-G-G-2CTAG1CGAT6CT19AG17CA15GA3CT40GA4CA13AG23TACA1CA5CT47GC5AG87AC28AG15GA44CA25CT4AC19AG13CT11TAGC1TG6CA2AC3TC18AC9GA12AG1AT5TC2ATGC9GA1CA8CA28CT1AG8CT12CT15GA4TA4CT11CT6AT47AG2AG26AC7CT30GA3AC29GA3CA12CAAG17CT2AGCA6GA1TC4TC3AG3AC9TA3CT7AG13CATG32CT1GA49CT8CT2TC2GA11GT1GA30TC38AG10GT1TG1GA1GACAAG6TG10ACTG36AGGACT5AT4AG8TC2AG9TA5AG1AGGA28AG8AT14ATGA12TC18GA24-A-C-A-G-C-A4AC8AC4AG7GA5CA1A-A-A-4AG11AG2CT10GCGA11CT26CTTG44AC5TC9AG12TC12GA5AC50AGCTTC4TA23TA24GT1GA1GA9ACGC6AG8CAGC1TA14AG6AT18AG4AG7CT2CG25CA5CT5AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,602,9088,9689,1,585,0.0,679,89.701,540,plus,8AC5TC8ACAG12TC12GA5AC24GA26CTTC4TA23TA26GA1GT7GA1ACGC2TC3AG8CAGC1TA14AG6AT6GA11AG4AG7CT2CG25CA5CT3GA1AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,160,1,159,9085,9244,4.40e-48,191,91.875,147,plus,8AC5TC9AG12TC12GA5AC50AGCTTC4TA19-T3TA14GT6 +MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9718,9060,410,9377,577,9624,0.0,10743,91.887,8325,plus,25-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G3-G-G-A28AGCATC1GT1GA1CATG1-G-A-A-ATG2TA3TC1-G-A-G3AC2CT3-G1TC1TC1-G-G1AC2-GTG2AT2-T-G1GATGGC4CA2-G-C2CG3-CAGCACGTG1AGACAG4-C-T-G-G-TAG4-C-G-C-C3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC39AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9718,542,8845,9377,1,540,2.31e-175,613,90.037,488,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9718,9071,369,9381,577,9623,0.0,10870,92.294,8372,plus,25A-C-TG1ACACTCCT1CT3-T4G-1CT1C-C-C-2A-C-T-28A-G-3T-4TA8TGAG20GA29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 +MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9718,541,8850,9381,1,539,8.58e-176,615,90.203,488,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,9151,512,9583,577,9685,0.0,10861,91.913,8411,plus,24-A-G-A-C-C2-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27-G-G2T-3GATA1AG1TG1GA2A-T-C-C-C-T-C-T-2TA3TC4A-TGCACG3AT1CT1CG1A-A-T-29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,668,8973,9614,1,649,0.0,688,86.976,581,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,79,273,351,577,649,8.05e-10,64.0,78.481,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-CTCGCGTA27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,81,405,485,577,649,5.83e-09,61.1,76.543,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-C-A-CTCGCGCA27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,31,273,303,9661,9691,8.42e-04,44.0,96.774,30,plus,28TC2 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,31,405,435,9661,9691,8.42e-04,44.0,96.774,30,plus,28TC2 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,9111,34,9126,646,9678,0.0,10578,90.967,8288,plus,21AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC12AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG38AG7AG20AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA27AT30AG4TC50GA57TC9CT7GA17CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTAG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA7AC11CTCT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13T-1TC2-A2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2-A1GA1CACT1GTGC2GC1AC2AG1C-AG1CAAG2-G-G-GTG14TC1TA2TC11GT7AC8-T-A3-A3CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-T-2AG2T-C-T-AG3CGGACTCA4CT1ACTC4C-T-T-6AGTCAGAGTG1C-TG3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11G-A-A-G-G-T-1GA2G-A-A-7G-G-G-2AGAC4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10-A-A-A3-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT5AG8A-T-G-7TAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12A-A-G-C-A-A-CT5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG5CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC8A-C-C-C-T-A-G-A-T-1GT4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT8AG20CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC27AG3AC1GTTG6CG2GA9C-A-G-8AG19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,598,8529,9126,1,594,0.0,670,89.632,536,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,33,1,33,702,670,1.52e-05,49.7,100.000,33,minus,33 +MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9718,9070,458,9461,577,9624,0.0,10908,92.415,8382,plus,25-G-A3-T-T-T3-T-C-A-G-T-G-T-G-G-A-A-A20C-G-1A-G-G-C-2TAAG17TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9718,542,8929,9461,1,540,8.47e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,9035,130,9032,649,9626,0.0,10330,90.349,8163,plus,18AG72-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-A-A-A47GA23CTACAG6GA31GA6GA29AG2GA75GT19GA7AG8TA13GATC20AG48AG20GAAG28TC1AG2GACT35GC53GA20AT2TC11AG17CA29GA38TC17AG2TC30TG22GT23GA2GA23CT2CT14GA47CT2CT47TC59TC77GA5AG14AG2CT17TA5AG29CT8GA32GT23CT3AGAC1GA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT19CT4CT3AG5GAAC4AG17GA11TG1TC5AT1AG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA8CA4AG3AG55AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG25GA31AG7AC32GA11TC56CT69CT5AG13AG25CT39AG83TA11AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA12GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG13TC23TC2AG2AG2AT4CT18CT3GA1CT18AG1TCTA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG8AT2TA5AG35CT8AG9AG52TC39TC26AG25TC35GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29TA18CG7AGCA10GA11GT99AG92GA13GA14TC23GA32AG13TC3AG2TC34GA30AGCA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14CT35AG25GA57TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2GT21GT1GC25GA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACTAT5TC2CT3CT4AG23AG23TCCA9CT13GC7TC14AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG2GA30GA20GA11GA8CT4GA14GA8AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC1AGCT4ACCT7TC4TC7AG4GA19TC2TA2GCAC4TG26TA1TA14CT2TG5TC6TA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-3GA6CG17GT2CTAG4CT5AG2-C-T-A5GA1CA1CT36AG35CT11CTCA10CT5CT14TC34AT2-T-G-G22TCGACTAG9AG10TA76CG6CG8GT9AGGACT4CA2TCAC2CT1AG2CGCT2TC-G-G-G2TA2-G1GT2-T-G-G-A1-A7AG2GA8TC5TC3GACT2CG4GACGAC7AG9AG3CG8CT9GA7GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-A-T-A-T-A-G-5TC2AG7TA2GT2AGCT51-T-T-G-T-G-C-C-C-C-G-G-C-T1-G-T-T-T-T-G-C-G-A-T-T-C-T-A-A-A-A-T-G-T-A-A-T-A-A-T-A-A-G-A-C-G-T-T-C-A-A-T-G-G-A-A-C-A-G-G-A-C-C-A-T-G-T-A-C-A-A-A-T-G-T-C-A-G-C-A-C-A45TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC14TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG3AC35GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT7TC2AT4TG2AG1-G-A-C1TCTA5AC10AGGA5GA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG29AG39CA36GA46CT46AC5AG14AG8CA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGT5TC2ATAC10CG46GA22CA7GA10GT18AT4TC20AGAG20AG60TA7GA2GC27TC2GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG17AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7CG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA42AG1AC28TA9GA3AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT5AG2TG1AG11TA5AG21CT1GA16AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,543,8492,9032,1,542,4.15e-180,629,90.792,493,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA9GA3AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT5AG2TG1AG11TA5AG21CT1GA4GA11AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,150,1,129,782,633,2.35e-34,145,84.667,127,minus,23-T-T-T-T-T-G-G-C-G-T-A-C-T-C-A-C-C-A-G-T72TC12AG16-C4 MK115158.1,Ref.47_BF.ES.08.P1942.GQ372987,0,9143,8926,8919,162,9029,68,8923,0.0,9530,87.790,7830,plus,27A-C-C-T-2T-A-2TCAC2GA1TG1CGCACA1CGCT1AG1T-C-TA1TC3CGTA38AT1AG21-C-T-G-G-T-G-A-G-T3-C-C-A-A-A-A-A-T-T-T-T43GA20AG2CT1AG6GA20GA9CAAC6GA2AG26AG2GA11ATGC82GA7AG4TC8AG8GATC20GA3AC2GTAG25CT2GA11AG21AGCT6A-G-C-10CA9GA37AGTCGC8AC3GA8GC1CT2AT26GA2AG2AG8GA38CA12GTCG15GA5GC3CT4CT23TC9TC7AC2TC2CT23TC5GA17GA2GT2TCGC16AG5GT11CT5AT5CT17GA6GCGA11AGTC2TC6AG7AG5AT5CT11AC5GA29TC3AGCT7CT9GA6AG5GA14CT5AG3CA6AT4AGCTTC18TA7GT35GA3GT1AG32AG2TA3GCCAAG32GA11AG11GA14GA16TC4AGACCT3GACA1TGCT1GA1GA19TA4AG4AG8GT2TC19AG17GA23GA12AG8GA20TC2TC5GA8AT17CT9CAAG18CT4CTTC2AG1GA3AGAC4AG11AG4ACGA8CGAG1TG5GA2AGAG2A-C-A-5TC2TC4AC9GA1CA2TA2A-C-C-3AG3AG2CT3-C-C-CAT1GATG9AG21TC12GAGAAG7GA2AGCA1AG38GA8AC2GA1GA1CT1AG7GA6GA40AG12GA3-A3G-14CA1TG21AG19TC26GA8TC47AG22GAAG2TC14GA2AG22CT6TC4ACGA23TC36AG7AC20TA11GA26GA11CT2CT5AG17AG2CT2CT5GA27CT1GA8TA21CT2GT2AG4CA8AG101CT5TC8AG1GA24AG11GA2TG2AC63GA22GATC4GA6TC4CT32AC2TC20CA30CGATAG4CA3GA2AG4GA15TC8AG11GA23TC17GA2GA5TC1AG3AC5AG3GA7GA8ACGA14GA4AG32CTCT13GA5AG15AT40TC17TC5AG14CTTC22AGAT10TC16AG3AG24GA25AG2GA2CT20TA4AG3AG9TA13AC14TC32TC2CTTC4GA2AG17AG50TC2AG2AG2AT4CT18CT3GA1CT1GA9AG6AG19AC26TC1AT9GA41AG20GA14AG2CT8GA30CA1AC18GT22AG5GA26CT3TG10AG2GA11GA5AG8GA11TA16GA9AG8TC5CT8AC8AG11AG28TA52TC26AG22AG2TC35GA5AG49CA22CACG3CT8TC1AC1GA25AG3GA4AG2AG38TA11GA5AGCG7AGCA14GA7GT26AG34AG37AG20AC73TC3CG22TA2TC11GA8AG2AC8TC8CA11AG17AG2TA34GA10AG19AG2TAGA14AT16AC4GAGA3GA2TC1GAGAGAGA5GTTC3AC9AT9AG7GA6TC3GA13AW4GAAG1GA3GAGACA2GA1CT7GA14CT3CA7AG23AG21AC1AGAG3GAAG5CG6GA9AG3AG11AG6CA1GA9AG25AGCA25TC9GA1AC17TC14GA2GA2CT10TC10CG1ATCA4AG1GA1AGGC6AG14GCACGA4CTGTGAAGCT1GRARGA2TC9GA9GA44AG8AG10GAAT8TC2GA2CT9GC7TC2CT3CT1GA14TCGA1AC2TC5AG10CAAG5GT6CA7AG2TG8AT2GAGC7TC14AG2TCCA1GT2CT4GAGA9CA2ACCGCA2TG6GA29GA20GA2TC17CT4GATA2CT8AG1AGGA7AT8CAGACGGTAT6TA54GR1AC8GAAGTCAGAGCT4ACCT7TA4TC7AG10TC1CT13CT5AG18TC11TGTCTA3AT13TG33ATGT4CG3AGGA1GA1AG2GT1CT1GAGAAT2CA4TC38TC2AG2GA2CT11GAGT4CACA1CG5GA1TG4AC1CT1AT5AC2TG2GAGT2GTGAG-C-C-A-C-C-3CA2C-T-T-G-G-G-A-3C-4A-C-3TA2TA1-T1AT3GA1CG1CT72CT2AG8CT7TC3CT5CT14TC30GA1AGGTAT3-G-A-A21TCGACTAG8TC23GA8CT41CA5CT8TC5CT4CA1GA1-T-A-C-T2-C-A-C-C-A-C-T-A-A2-C-T-A-G-C1AT5GACT1CG15CT2TC5TC3GACT6ACGCCA2TCAG4A-T-A-A-2TA1CA2AG1-G1CG18GAAC11AG3A-3A-1GA2-C-A2TC2TA2CT2C-T-A-T-A-A-3CT2AC13AG7TA5AGCT12CT9GA37GA26GT6AC1TG16TC4GA7TC29AG18CT2TC13TC10GA4GA2GA4TC2AG3AC5TA4TAAG1CT1GA3TACA3CG12AG2AG2CT3AT2GA2GAAGAC10CT7AGAG27AG8GC1GAAG1CT18CT9GA30GA13GA1GC7AG1AC7TCGAAGTA6AG1GA11AC1GAGTGA1GA14CT23GA11CT1GC6TC3AG29CTAC15TA3AG1TG1GA1AGCA4GAGAATGA1AT1AC2GAT-A-C-2GA1GT6AGTCAT4AT1T-1AC1TC1T-T-10CA6GA5GA6GA5AT47CT1AC4GATC14TC8AGCA2CT2CG18GA2AGTAG-3CA1G-A-1AG1C-A-C-2CG3AG1TC11GA7GA6GAAG39CA17GA18GA19GC17AT1AT6CT46AG3AG1AGAG13AG7AT21AG12TC7AG29GA47AG11TA12CA2CA26CTTA13AGAC14GC3TC12ATAC1CT-A3G-1TC1TG2CT5TG35CT9GAAGGT10AG8AC2AT7AG40TC11TC7CA13AT4GC23TC21AG4TA15AG1TAGA34TC8AG2GA2TC7TA2TA6CTGC21AG8GA34AG3AGCA1TCAG3CAAGTC12AC8GA7GA10TG41TC7GAGTAT30GCCT6GA2TC8TC5GA11CT20TCGA1CT8CT2CTGA7CA4CT21GATA9TCAT8ATAGTC1TGTG7AG2AC12CG18GA11GA13GAGA2TAAG1TGCG6CA3AG1GAGTGA1GT3GA6GA1AT14GA6GA1TC1ACGT3GACT6TA5AG7CTAC11-A6A-8TACA9AG3TC3CG7CT3GC4TC1GTTG18G-A-A-5GT2AG5GA2TC38AT12GT1AC9CTAT39CT3CAAGAGCA10TG11GA5CT3AC7GA2CA39AG1AC2AG6CT10AG17GA3AG1GT2AC8TG13CA9GAGA5ATTG4TC7TCGA3AG3GA5GA5CG2CTTGCA3GC8GATC1AGGA16CA1GA8TCCTCAGATG5GA9AC13CT6AG10GT24GA2AG10AGGA6CT3AGAC31AG2 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,9386,125,9411,380,9719,0.0,10743,90.550,8499,plus,41GC19CT1CT3TC53GA104AC10CT37CT11TGAGGA11AC37AG22CT12-A-A2TA62CA9AC7GA38GA44GA29GA8GA23GA8AG19AG8TA7AG5GATC3TC5CT2AG14TGGA20CT2AG1TC35GA27AC6GA4A-G-C-A-G-T-C-A-A-30CAATTC15TC7TCCA58CA2GA2AG80GA57TG10AG59GA39CA47AC4GA31TC30AG5TC8TC47AG62CT3CT10AG8AG38GA2GA6AG4CT2AG8CT22CT4G-G-T-GAGA1GT2AG3AC14AG19GA4AGCACT1AG32CATC3TC68CT2CTTA28AG12CT22CT2CT4AG41TC5AT10GA24CT18CT2CATA9AGAG29GA84AG60AG4CT40AG44AC31TC8AG20AG80AG56CA20GA2TC17GA17GA8AG14TC5GA59AG20CT8TC9AGGA6AG28CTTA14CA8GA50TC14GA11AG35CT17AG2CT22AG10GA5GA5AG1CG6GC1GA18TC19GA20TC11CT92AG26TCGC15AG21GA3GA1TC2GA14GA3AC26TC68GA28TC8CA44GA10CTAG29GA8AG5TG9GA7GA9GA12TC11GA1TC1AG8GA2AG22TCGA41CT1GA15AG47TC23TC2AG9ATAT22GA1CT8GA9AG2CA2TC41CT19AG65CTAC1GA50GA8CT3AG61AT12AG10GA20GA2AT2TA14TC10AG22AC1AG8GA11GA3AG31GA72AG16CT14GA2CT26GA20CT3AC1CT31TC9AT2TC5TC12AG1CTAG4AG2CT1AG9CT8AG2TAGA1TC8GA38GA124AG4TA17AG35CT56GA13GA14GC44AC2CA8AG100CT20AG5AGAG8AG7GT4CT5CT12AC48AG57CT37AG17GACA21AC4CT2TC5TC11AC12CA1AG3AT10TC1GT6TC5TG38GA6CT12TC4GA2GA34CTGA3GA29GA5TC14AG6TC11GA7AG19GAGT24GAATAT9AG7AG26CT14AG1GA15AT9TC1AG8TC2-T17AGCA8GA6AG1-T3-C-G-A-C-A7AG14CA14GA2AG28GAGA3CG6AC21CT20CT4CT2AC3GA1GC31CA5AC5GA2CG3CA2GAAGGA9TC8TC1CT5CT4AG19TC7TA2GCACGA3TGCT23TC1GACT22AT8CA2TA4GA17GA4AGGA11AG6AG5AC3GTTA32CA2GA2TACAAT1GTAC2AC1-C4CG-G2CA1CGTGTGAG-G12GA2TA10AG24-G-A2CA1-T37AG2TA17CT33AG44GA17CT3AT17AT3TC3GT1AG6AG7GA57CATACA9TC7CT1CG6TG9GTCTTG2CG1T-C-1CTCG1GTC-7ACTC1GA3A-G-A-2AGGT1AGGC1A-A-6AT1T-1CT1TA4G-G-A-G-A-C-9AG23GC1CGTCTA7GA2CA1AG4TGCTTG6CG2CTGA4CT10GA6GA1GAGA3AC7GA1G-A-C-1AG3AC2ACTC2TC4GA5TC19GA1CT8TC20TG5CT2TC38GA13ACAG22AC35AGAG2TA5GA5CT17TC17AG3AG1GA10ATAC9AG22GA8GC3CT5CG40GA2ACAC4GC-C-A-G-A-G-A13TC1AT2TGAT1GA3CT4CA1A-A-T-7GA4AG3AC10CT15GA9CAAC8GA7TC2CGACCA8AG1GA2GA1-T-T2-A-A-A-T4GA3CA11CGTCCA27GA1TC16AG23AT5AC4AG15CTCTA-C-G-14AGT-A-A-16GA8-G-G-A-A-G-T-G-A-C1TC6AC5GA18GA6GT7GA7CA24CAAGAT11TA27CT2GATCTA11AT1TA2AG2CA2GA4ATGCC-A-A-5CT60GA83GAC-T-G-6AT11CT34GC3GA5TC11AG6TA21AG12CT22GA35AG15CA4AG18CA16AG29CT9AG13CTAG15GA4TCATTG3GC1TG8CTAC3TC18AC1AG7GA11GA8TC2AT11AG7GA8GA4TAAG12CT5TGCA3GA5GA8CTCT16TC27AT26AG58CT8GA2AG2GT7CA2GT4GA4AG22AG3CA7GA9AG17ACGA1GT10CATC4TC3CG6TA13AG2AG25AG13AC11GATC4GA8AC49GA5CT12AC14AG1CT11CT8TC26AGAG1CT4GA10AG2AG4GT6TA2ACTG12GA17TG6GACT19AC2AG10AGGT4GT1GAGT10GA12AG5AGGA3AG16GTGA28CA3TC29CGACGT6CG3AC24AG5AG5AG2CT10GC3CT11GA26GA3AC1GT52AGGA29TC25GA3AG2TC42GT6TA4-C4-A-C-C-A2-T1TA3CA1-A1CATA1TA1GATGGATA2CGTG1TCGAGA3CATG-G5TA1CA1-C-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA3AG1AT-G-G2CGTA1-C-C-G-G-A-G-A-G-A-G-A-A-G-T-G-T3C-5CA1CGCTCTGTAG4GCGCAG3-A1AC1ATGTCTGC1-T-C1AC2AG1ACAC1CG4GCAT1-C3TC-G-G-A-G-T-A2CTGC1CA1CA1GC-T-G-C-T3-A3-A7GA-C-A2CG1-A-C-T-T-T-C3ATCGAG1CG1-C-T-T-T-C-C2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,635,8840,9411,1,634,9.31e-121,432,76.535,486,plus,23ACAGGA29TC25GA3AG2TC18GA23GT6TA4-C4-A-C-C-A-GGT2TA3CA1-ATGCATA3-A1TAGATGGA1CGTC1TAGAGCTA2CGTG5TA1-A2-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA5-T-G-G-A-T-G-A-C-C-C-G-G-A-G-A-G-A-G2TGCTTGCT3C-5CA1CGCTCTGTAG4-C-C-G-C-C-T-A1GC1-T-T-T1CA1GC1-C1AT1-G-C-C3AG2-C1AGGC1AT2AG3GT1GCAT2TACATGCAGAACCT2AT1GAACCA3-A7-A-C-A-A-G-G2-C-T-T-T-C-C2-T1CG1CG2-TATGT1AC2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,255,125,379,9465,9719,5.83e-95,346,97.255,248,plus,41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,211,8973,9182,544,749,1.01e-65,249,92.417,195,plus,62AC10CT49TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,151,1,150,604,749,4.57e-39,161,88.742,134,plus,2AC10CT37CT11TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,91,8973,9063,9629,9719,9.52e-29,126,97.802,89,plus,62AC10CT17 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,9377,104,9441,402,9683,0.0,9753,86.765,8136,plus,19GC21CT24GA78TC55GA1TC1A-A-AT1CT1GA2C-2AGCTCGAT1A-2GA1CACT1ATGC37TGAGGA8AG2AC49AGAG22-A-A-A1TA11AG15AG4AG20GA3AG1AG12AC3AG3GA7AG10AG2AG15GA17AG8AG3AG43GA8AG3GA3TC1AG1AG25AG37CA10AG3AG7AG6TGGA13AG5GT8AGGA4AG26GA11GA12AG2AC4ACGAGACT3AGCT3TC7TA16CA1AC2AG8AG37AGAG17AG2AG17AG53TC14AGAG1TGAG4CT8TC15AG2GATC9AG13AGAG6TG1AG15AG22AG10AGAGAG14AG29AG3AG7CA20AG2AG1GA13AGAG5TC2AG3CT15AG22TC1AG7AGGA3AG1GA5AG25AG13TC8AG8AT5AG1AG10AG7AG10AG5GA5AG2TC11AG17AG8AG32AGAGAG4AG2AG13AG4AG6AG19CT4GAGA1GT4CT1AC26AG13CACT6AG21AGAG5TC5AG8AG8AG6AG7AG5AG1AG4AG3AG14AG4CT3AG20AGAG3AG12CT4AG10AG3C-T-2C-C-T-C-A-A-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-6AG9AG2TC1-G-G-G1AT3AGGA11TC14AC1AG11GA9CT13AG20AC17AG1AG1AG10AG5TC5AG31CA2AGGAAG7AG3AG2AG16AG1AGAG5AG2AG19AG5AT3GA3CT9TCAT1CTAG4CT9AG7GA30AG20CA2AG8CT13CT2TC8AG24AG7CT19AG6AG41AG2AG5AG3AGAG16AG28GA20TCGA1CT7AG2AG32AG9TC4AGAG3AG8AG1TA11TC3AGAG1CT19CA8AG5AG30AG9AG3AG42AGAG15TC14AGAG3AG4AG34GA3CT16GAACCA30AG15AG17AG4AG12GA2AG4AG5GA8AGAT6AGAGAG2TC19GA2CT11CT10AG4AG1GT41AG14AC2TC1AG27AGAG1AG10AG15TCGC2AGAG9GA1AG12GA7AG1AG11TC11GA44AG13TA9AG3CTAG12GT4GA15CA10AGAG1AGGC4TC2GA21AG16AG7AGGA13CT2AGAG8TC14GA11AG15TA10TC10AGAGAG3GA14GA1TC1AG11AG7AGAG7AG9TG16AG3CT3AG3AGAG8CT2CT22AG12AG12AG2AG23AGAG9TC1AGAG2TG1AC5CT1AG8AG11GA1CT3AG20AC3AC18AG5AG8CA3CT7CT5AG5AG2GACT28GA9AGAGGA21AC21GA12AG15AG4AG5CT7AGAG2GA5CA6AG5AGAG1AG10GA3AG5CT11AG6AG19AGAG6AT2AG8AT2CA3AG1AG16AGAG3AG11AG10AG6AG47AGAG6TC6AG1GA20TA8GA22AG4AG7AG21AG19GT11GA3AG4AG11CT3AC8CT5AG28AT9CA11AG2AGAC3AG2GT1AG11AG2AG3AGAGAG9AG6AG1TA25AG7AG7AG5TA18AG4AG4AG10AG66AGAG2AG10AG30AC5GA43AG11AG10GA9AG18TC15AGAG21CT35AG7AG7AGAG13AG31AG28TC11AG5AGAG6CT1AG1AGAG2AG1GTCT9CT2TC2CT4CG1AC28TC11AG1GA9AG16AGAG19AG12AG2CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT39AG3AG23AG19GA26AT1AC12AG7AG21AG9AGAG6TC9AG18AG10GAAT17CT5AGCACTAT5AC2ATAGAG1CT2AG1AG3TC17AGAGAG9AG2AG4AG27AC10TC2-T10AGAG5AGCA15AG2GATC2TGGA2AG2AG12AG13AC14AG23GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT11AG2AG9TC7TA2ACACGA3TG26GACT20AG1AT8GAGT4AG6AG27TC2AGAT5AG5AC3GT1AG28CT3-G-G-A-G3GT5GC1ACG-A-A-4CGAGGACG1C-1TG1TGAG2AG2AG2AGAG5GC9AGAG22GA1GA5TA4AGAG16AG11AGAG1GAAG2TA4ACTC11CT32AG13AG30TC8TA7AT4AGAT21TC4AG7AG10CA22AG6AG22CT6GA16CG6TG11AG2AG3AG5GAT-A-G-G-1AT1TC3ATCAAGAT1TG2TG1AGTGCGTACG5A-A-C-4AGCG1AGT-A-C-4AG1AG3AT1T-G-1CA20CG4GAAGGC7AG3AG4GAAG12CT17GA1CA2GA11AT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG3AG7AG8GA5ATGA2GA3TC7AG5AG9ACGA27AG7AG8GA21AG1TC2CT9AG2AG2AG5CA9ATAC8AG6AG6ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C2AGAG7AT2TGAT1GA3CT1AG2CA1G-A-T-5AG1GA4AG20CT3-A3ACCA1GA2TG3G-1GA9GACAAC1AG4TC1GAAGAC7AGGA3AC5AG4AT26AC3AG3AG4ACTC8AT19AG3AG18CTAT6GA18A-A-2G-7AT3AT1CG1-G2-C-T-G2CGAG1-T-C2CA5AC1AG2-G-G2TG-T-G-A-C-A-C-A5AC5GA20CA4GT7GA5AG22TC6AGAGGAACTA6GA2CT17AG2AGAC14AG2AG3CAAT1CGTC2TC1GA1AG1AGGTACAC4CT10AG3AG1AG2AG6AG8AG21CT17GA6AGAG19CA1AG4AG3AG21AG1AGAG3C-G-T-8AT7CTAG7AGAG2AG16AG8GC3CA10AG5AG29AG12CT6AG22AC18AGAG8AG15GA5TG4AG12CA1AG15AGAG6AGAG8AG20AG9AG4AG6AG3CT9T-A-1AT1TG1CA2TGCA1ATAT1-G-A2AC3TC5AG4CG3AG13CA1AC10AGGCAT5TC2ATAC4CA2AG12TA3AG2GAAG11AC10AG3CT5CA4AG4AG5AG5AG5GATC8AT5AG1AG10AT25AG3AG6AG4AG11TC25AG5CT11AG2GT7TA12AG2AGAG4AC12AG18AG1AG12GA8GTATAC9CATCAG3TC3AGCG4CT4AGAG5CT4AGAG11TC13AG3AG1AG18GACATC2AG2CT4CG2AC4AG4AG2AG1AGAG2AGAG2GAAGTC6GA2CT1AG2AG2GA6GA7AGAG1TG37AG3TC3TC2CA11AGAG1AG7AGAG12AGGT4AGAG1AGTC1AT1CT6TA3TG14AGGA8AG5AG4AG1GACT5AT4AG2AGAG9AG10TA2AG2GACT1AG3AG4GA6AGAG8A-G-A-A-A-3T-T-A-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-A-G-A-A-A-G-A-2AG17CA2AG3AGAG17TC1AG6TC2AG23TG2AG4TC16AG18AG2AG2AG2AG2CT10GC6AG26AG6TG2AG47TC1GC5GA11AT9TC5GA1TC14AC13GA3AG14AG12AT24TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG11AG7AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,598,8845,9441,1,598,0.0,659,88.629,530,plus,14TC1GC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA5AT24TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG11AG1GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,201,104,304,9487,9687,2.55e-74,278,98.010,197,plus,19GC21CT24GA78TC55 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,111,1,111,627,736,2.52e-31,135,92.793,103,plus,40TGAGGA8AG2AC45C-1AC3TG4 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,9078,150,9207,636,9627,0.0,9749,87.905,7980,plus,31AG41-A23CG21GA3TA38TG20CG3AG8AC3AG10TCAGCGCT9AGAG16GA17AG30CT2CT14GATA13CT2GA5TA2AG15GT50GATC9CT2AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC11AG8AGCG1ACTA24AG10AG28AG18CT8AG41AG1AG20GA11AG11TG2GA10AG7TG19CG22AG9AG20CT24AG3AG7CA28CT20AGAG1GACT4CT24GATC7TC14AG7AG10AG3TC11AG16AGGA2TC8GT8TG10AG18AG14TC14CT14AG8AG6TC32AG13CT41GT5CTTA7AGGA4AGGA12AG14AT28AG1AG10AG17AG6AG7AGAG6AG8AG23AG6C-1G-A-C-T-A-A-G-A-C-13AG7TC9CT15AG9CT26GA4CA14TC2AG2AT4GA5GA4TC15AC3AT4CA1AG15GA10AG20AC1ACAG1ACTA7AG5AG11AG47AG1AG11AG2AG16AGAGAGAG5AG2AG29GA3CT9TC30AG10GA2AT12AG16CT3CA2AG22CT2TC8AG21TC7AG3AG6GA36GA6AG11GA4AG2AG9AGAG7AT8AG7GA8TC44AG1AG16CA19AT10AGAG9CT2AG49AG5AG23TC5CTAG10AG23CT15GA6AGAGGA3AG25AG3AG4AG55GAGC31AG15AG18AG6CT14AG2AG17AG5AG5CT14GA12AG10TC4AG3AGAG24AG16CGAT9CA10AG27AGAG1AG2GA7AG6CT5CT2TC4AG11AG46GA72CTAG33GA11AG2ACGA2AG5AG44AGGA13CT3AG26GA24GA2CATC4GACG12AGAG22AG2TC8AG7AG1AG3TCGA9AG18AG11AGAG2AG5CT17AG3CT3AG28AG10TC9AG2AGAG9TC2AGAG11AG9AGGA8GTGA1CT3AG10GA6TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG6AG1TC2CT7AGAG2CA12AG6AG31AGAC1AG7AG1GA10CT5AG10AG8AT8AG16AG16AG52GA6TC11CG1TC6AG53AG5AG7AG21AG4CT18GC28CT3AC1CT19AG11TC9AT21AG1CTAG4AG4AGAG10AG2AG3AG1AGGA15AG1TA14TC9AG8AG13TAAG27AG48TC2TC51AG35CT14TA18AG22GA1AT71TC33CA4AG6AG58AG3CA21CT2AG5AGAG7CAAG1AG3AG1GT4CT19AC1AC6AG2CT22TC3AG3AT2AT13AC8AGAG32AG2CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC5AG8TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG7AG5AGGA2AG16CTCT12TC4CT2TC2-T10AG6AG9GA5ACAG3TC22AG17CATC9AG3AG14AG4TAGA10AC16CAGA24CT4CT7AGGC29AG19TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT8CT2GC13GACT24TC6TA1AC10AG6TA11GA18AG5AC3GT33CA-G3GA1CACT1ATGC2GC1AC2AG1C-C-1CG1CGTA1-G-G-G-G9AG4TC1TA2TC5AGAG3AGGT1AG5AC8CT1-C-A-G1CA2CA4AG16AGAGAG8AG1AG3AG8TC38GT6AGATGA10AG3AC2CA25GA6GA7CT3AG1AT14CAAT10AG18GA28AG24GA3CT18CG6TG9A-A-2TG2AGTACA1AG1C-T-1GAC-C-4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5AGT-G-A-A-A-2AG8AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT9AG2GA2GA11GA1AT4G-T-A-A-A-A-A-T-A-4GCGA2A-A-A-6AT3TC2AG24AG21AG18TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT4CT18AG2AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT2GC2CT2AGCA1TA4AG2GA4AG8GA4AG11-G2AC2GA2TGA-4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA6CATG13AGAG8GA2AT2GA1TC3TC12AG3AG19AT7GA16AG1ATAT11AG1A-A-T-8TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGATAG1GA35GACT2GATC10AG1GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA3AG5AG9AG8AG7AG22CA6AG8AG2AG11CA1TG20AG1AGGA12AG1AGAG2CA1TA1AG6CG6AG7AGAG19AG8GC3GA10AG41AG14AG40AGAG22AG1GA8TG1AG14AG14AGAG6AGAGAG29AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AGAG2AC1AG7GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA1AG11AGAG4AG4GA4TA3CA1GT1AG3AG1AG10AT10AG6AG8AG2AG17AG2AG4GT13AG9AG5CT8GA2AG2GT7TA11AC3AG18AG3CT7AGGA4AG2AG3AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC13AG12AG4CTGAGA4AG5AG8AG8AGAGAG2AGAG5AC2GC2GA4AG2AG9GA7AG10AC13AT14CTAG7AC15AG9AGAGAG11TG5AG3GCCT1TG11TG11CG1CA16AG4AG1GACT13AG3AGAG5TG5GA3GTCATGCTAGAT1GACT1AG8GA1CTAG3AG3GA1AG3AG9A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-9AG3CA2AG3AGAG20AG3GA10CA1TC31AC1GTTG6CG12CG2AG2A-A-A-2AG5AGAG12GC18GA15AGGC4CG5AC22AG11TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC3AG3AG5TA18TG8AGGA12GA1GATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG1AG5GT3GCACAGCG1CG8AG2GACG35AG1AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,543,8665,9207,1,542,1.27e-164,578,87.293,474,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC3AG3AG5TA18TG5TG2AGGT7GA4GATCGATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG7GT3GCACAGCG1CG8AG2GACG37AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,151,1,150,781,631,2.96e-50,198,96.026,145,minus,22AT3CT21GC23-T41TC12AG23 -MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9719,9036,155,9136,649,9627,0.0,10637,91.479,8266,plus,18TGAGGA85-A-A-A49TA24ACAG27AG10GA57CT2CT5TG9AT4GA2AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC13ACGATC1CG2GACT20GT12CA31GA23GA20CT2TC8GA2AG23GA95GA42GA13AG50AG10CG11GA27CT32GA30TC9AG49GATCCT17AT2GA5TG26AG14AG41AG2AT35GA2GA14AG42AGAC2TC41CT35TC50GA68CA18CT38GA13TC5ATGA6GA7TC18GA1GA9GC11GA9AGAG40AG41CT97CTTC68CA6TC19TC20TC8AG12CA88AG8AG8GA95GA11AG41CT20GA6AG35AG11AG43TC85TC24GA38CT53AG11CTTC6AG7TC1GT11TC20CT8GT59CA5TC27CT7AG26TCGC13GA2AG19AGGA3GA7GA11GA4AC39GA2AG59GATA22GA50GA10CT7AG64GA14CT4GA9AG8GA2AG11TA2CA11AG23CT14CT32AG5AG8TC2TA14TC23TC37GACT14GA6TA31AGCT1GA10GA6AT11AG39CT7AC18ACGAGA12AT39GA6CT2TG77CA8GA23GT2GA16AG66TC11CT8GA10CT37TC88GA8AG11CT2CT2CT17GA8GA3GA10AT8AC1CG10AG12AG18AG2GA13GT3CA71AG35CA93CA19GA46AG4GA25AG2TC2TC141CA32CTAG5AGAG6CTCAAG29AGTC35GA74AG17CG3GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG59AC22CT5AG10GAAT25CTAT5TC8GA2AG33AG14TA31TC2-T15CT1AG16AG1CT43TC34GA3CG10AT14AG2CT34GC46CG3CA3AGGA18TCATCT5CT9GA7TC6TC4TC1CTTA2TCACTA3TG2AG23GACT4TA17GT8CA12AG11AG6GA1GA6TC15AC7TA2GA32TACAAT1GT-C2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC12AG13AG4AG2GA4CACA1GA1GT35GAAG7AC37AGGA8CT55AG5AT1AG1GT6AG6GA16GA3AG10TA38TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CG-C-G-G-G-A-G-A-A-T-G-A2CA1TG1GA-G-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG2AC1AG6GTCAGT3CT11AC5TA2GA2GCAC7GA1AT2G-A-A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT34TA21AG8GA13AC5GA5ACGA26GA19AG55AG1GA10AT4AT4AG6AG6AC13TC4GCGAAC1GT1CTAG2CG5TATACT4TC27TA2ACACAG3-C-C-A-G-A-G19TGATCT4CT4GA1T-A-T-7GA1CT2AG2GA21GA1-A-G-C3TA28CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT16GA8AG26CT5TC9TA2TCCA15CT3ATCT3AT1A-T-G-5GT1TG3TAGC-T1CA1-G-G3TA3GA1TC3CG1-A-G3-G2GATC1ACTA5AC4AC25CA8GAGA44AGCA3AT20GC1TA14GT2GT2GTGATGGC1TATC5AGAT1TC4CT3TC15AG6AG3TC37GA16AG19AG14AG5GA11AG3CA1GA6AT25CA20GC5AGGA9AT11GA1GT19AG42TC25TC18GA23CA16AG2AGCA35AG14CGGC7GA1T-G-G-G-C-A-3CT3ATAC3AG2TAGC1CG6GAGA1AC3TC18AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG28CA34GA5TA2CA1AT18AT69AG15CT11AG10TA7GA1TC9GC27GA17AG2GA7GAGT17TC3AG20AG35CA17GA1TCCG62GA5CT29CT11CTAG7TC4TC9AG12AG1AT6AG2TG5AG2AGTC1GT8TA3TG12GA17AG6GACT38AGGT1GA8ACAC1GA1AT2GA14A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-G-G-G-A-22GA17AC14TC8CA1TC8GC14TC7AC31G-A-T-19GC21CA8TC2AG6CG7GT39GA2TC9AG3GA41TC10GA25AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT23AG7CT3TA21CA12AG11ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G21CT22GC18-T56TG45 -MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9719,542,8609,9136,1,542,1.63e-174,610,89.852,487,plus,11GA2TC8ACAG3GA41TC10GA36CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT6GA16AG7CT3TA21CA24ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG21CT22GC18-T56TG45 -MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9719,9144,312,9387,577,9686,0.0,10905,92.104,8422,plus,25-G-A-C3-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23C-TA1TA2TG1AC2A-2GA1T-C-C-C-TG1TG3TGCGTGCATA1GC3TA2CA2C-C-G-AT4GC1T-A-2TGACGAAG5AG18AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25 -MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9719,654,8787,9414,1,645,0.0,705,88.532,579,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,9385,125,9411,380,9718,0.0,10753,90.581,8501,plus,41GC19CT1CT3TC53GA104AC10CT37CT11TGAGGA11AC37AG22CT12-A-A2TA62CA9AC7GA38GA44GA29GA8GA23GA8AG19AG8TA7AG5GATC3TC5CT2AG14TGGA20CT2AG1TC35GA27AC6GA4A-G-C-A-G-T-C-A-A-30CAATTC15TC7TCCA58CA2GA2AG80GA57TG10AG59GA39CA47AC4GA31TC30AG5TC8TC47AG62CT3CT10AG8AG38GA2GA6AG4CT2AG8CT22CT4G-G-T-GAGA1GT2AG3AC14AG19GA4AGCACT1AG32CATC3TC68CT2CTTA28AG12CT22CT2CT4AG41TC5AT10GA24CT18CT2CATA9AGAG29GA84AG60AG4CT40AG44AC31TC8AG20AG80AG56CA20GA2TC17GA17GA8AG14TC5GA59AG20CT8TC9AGGA6AG28CTTA14CA8GA50TC14GA11AG35CT17AG2CT22AG10GA5GA5AG1CG6GC1GA18TC19GA20TC11CT92AG26TCGC15AG21GA3GA1TC2GA14GA3AC26TC68GA28TC8CA44GA10CTAG29GA8AG5TG9GA7GA9GA12TC11GA1TC1AG8GA2AG22TCGA41CT1GA15AG47TC23TC2AG9ATAT22GA1CT8GA9AG2CA2TC41CT19AG65CTAC1GA50GA8CT3AG61AT12AG10GA20GA2AT2TA14TC10AG22AC1AG8GA11GA3AG31GA72AG16CT14GA2CT26GA20CT3AC1CT31TC9AT2TC5TC12AG1CTAG4AG2CT1AG9CT8AG2TAGA1TC8GA38GA124AG4TA17AG35CT56GA13GA14GC44AC2CA8AG100CT20AG5AGAG8AG7GT4CT5CT12AC48AG57CT37AG17GACA21AC4CT2TC5TC11AC12CA1AG3AT10TC1GT6TC5TG38GA6CT12TC4GA2GA34CTGA3GA29GA5TC14AG6TC11GA7AG19GAGT24GAATAT9AG7AG26CT14AG1GA15AT9TC1AG8TC19AGCA8GA6AG1-T3-C-G-A-C-A7AG14CA14GA2AG28GAGA3CG6AC21CT20CT4CT2AC3GA1GC31CA5AC5GA2CG3CA2GAAGGA9TC8TC1CT5CT4AG27TA2GCACGA3TGCT23TC1GACT22AT8CA2TA4GA17GA4AGGA11AG6AG5AC3GTTA32CA2GA2TACAAT1GTAC2AC1-C4CG-G2CA1CGTGTGAG-G12GA2TA10AG24-G-A2CA1-T37AG2TA17CT33AG44GA17CT3AT17AT3TC3GT1AG6AG7GA57CATACA9TC7CT1CG6TG9GTCTTG2CG1T-C-1CTCG1GTC-7ACTC1GA3A-G-A-2AGGT1AGGC1A-A-6AT1T-1CT1TA4G-G-A-G-A-C-9AG23GC1CGTCTA7GA2CA1AG4TGCTTG6CG2CTGA4CT10GA6GA1GAGA3AC7GA1G-A-C-1AG3AC2ACTC2TC4GA5TC19GA1CT8TC20TG5CT2TC38GA13ACAG22AC35AGAG2TA5GA5CT17TC17AG3AG1GA10ATAC9AG22GA8GC3CT5CG40GA2ACAC4GC-C-A-G-A-G-A13TC1AT2TGAT1GA3CT4CA1A-A-T-7GA4AG3AC10CT15GA9CAAC8GA7TC2CGACCA8AG1GA2GA1-T-T2-A-A-A-T4GA3CA11CGTCCA27GA1TC16AG23AT5AC4AG15CTCTA-C-G-14AGT-A-A-16GA8-G-G-A-A-G-T-G-A-C1TC6AC5GA18GA6GT7GA7CA24CAAGAT11TA27CT2GATCTA11AT1TA2AG2CA2GA4ATGCC-A-A-5CT60GA83GAC-T-G-6AT11CT34GC3GA5TC11AG6TA21AG12CT22GA35AG15CA4AG18CA16AG29CT9AG13CTAG15GA4TCATTG3GC1TG8CTAC3TC18AC1AG7GA11GA8TC2AT11AG7GA8GA4TAAG12CT5TGCA3GA5GA8CTCT16TC27AT26AG58CT8GA2AG2GT7CA2GT4GA4AG22AG2TC8GA9AG17ACGA1GT10CATC4TC3CG6TA13AG2AG25AG13AC11GATC4GA8AC49GA5CT12AC14AG1CT11CT8TC26AGAG1CT4GA10AG2AG4GT6TA2ACTG12GA17TG6GACT19AC2AG10AGGT4GT1GAGT10GA12AG5AGGA3AG16GTGA28CA3TC29CGACGT6CG3AC24AG5AG5AG2CT10GC3CT11GA26GA3AC1GT52AGGA29TC29AG2TC42GT6TA4-C4-A-C-C-A2-T1TA3CA1-A1CATA1TA1GATGGATA2CGTG1TCGAGA3CATG-G5TA1CA1-C-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA3AG1AT-G-G2CGTA1-C-C-G-G-A-G-A-G-A-G-A-A-G-T-G-T3C-5CA1CGCTCTGTAG4GCGCAG3-A1AC1ATGTCTGC1-T-C1AC2AG1ACAC1CG4GCAT1-C3TC-G-G-A-G-T-A2CTGC1CA1CA1GC-T-G-C-T3-A3-A7GA-C-A2CG1-A-C-T-T-T-C3ATCGAG1CG1-C-T-T-T-C-C2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,635,8840,9411,1,634,9.31e-121,432,76.535,486,plus,23ACAGGA29TC25GA3AG2TC18GA23GT6TA4-C4-A-C-C-A-GGT2TA3CA1-ATGCATA3-A1TAGATGGA1CGTC1TAGAGCTA2CGTG5TA1-A2-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA5-T-G-G-A-T-G-A-C-C-C-G-G-A-G-A-G-A-G2TGCTTGCT3C-5CA1CGCTCTGTAG4-C-C-G-C-C-T-A1GC1-T-T-T1CA1GC1-C1AT1-G-C-C3AG2-C1AGGC1AT2AG3GT1GCAT2TACATGCAGAACCT2AT1GAACCA3-A7-A-C-A-A-G-G2-C-T-T-T-C-C2-T1CG1CG2-TATGT1AC2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,255,125,379,9464,9718,5.83e-95,346,97.255,248,plus,41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,211,8973,9182,544,749,1.01e-65,249,92.417,195,plus,62AC10CT49TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,151,1,150,604,749,4.57e-39,161,88.742,134,plus,2AC10CT37CT11TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,91,8973,9063,9628,9718,9.52e-29,126,97.802,89,plus,62AC10CT17 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,9376,104,9441,402,9682,0.0,9757,86.775,8136,plus,19GC21CT24GA78TC55GA1TC1A-A-AT1CT1GA2C-2AGCTCGAT1A-2GA1CACT1ATGC37TGAGGA8AG2AC49AGAG22-A-A-A1TA11AG15AG4AG20GA3AG1AG12AC3AG3GA7AG10AG2AG15GA17AG8AG3AG43GA8AG3GA3TC1AG1AG25AG37CA10AG3AG7AG6TGGA13AG5GT8AGGA4AG26GA11GA12AG2AC4ACGAGACT3AGCT3TC7TA16CA1AC2AG8AG37AGAG17AG2AG17AG53TC14AGAG1TGAG4CT8TC15AG2GATC9AG13AGAG6TG1AG15AG22AG10AGAGAG14AG29AG3AG7CA20AG2AG1GA13AGAG5TC2AG3CT15AG22TC1AG7AGGA3AG1GA5AG25AG13TC8AG8AT5AG1AG10AG7AG10AG5GA5AG2TC11AG17AG8AG32AGAGAG4AG2AG13AG4AG6AG19CT4GAGA1GT4CT1AC26AG13CACT6AG21AGAG5TC5AG8AG8AG6AG7AG5AG1AG4AG3AG14AG4CT3AG20AGAG3AG12CT4AG10AG3C-T-2C-C-T-C-A-A-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-6AG9AG2TC1-G-G-G1AT3AGGA11TC14AC1AG11GA9CT13AG20AC17AG1AG1AG10AG5TC5AG31CA2AGGAAG7AG3AG2AG16AG1AGAG5AG2AG19AG5AT3GA3CT9TCAT1CTAG4CT9AG7GA30AG20CA2AG8CT13CT2TC8AG24AG7CT19AG6AG41AG2AG5AG3AGAG16AG28GA20TCGA1CT7AG2AG32AG9TC4AGAG3AG8AG1TA11TC3AGAG1CT19CA8AG5AG30AG9AG3AG42AGAG15TC14AGAG3AG4AG34GA3CT16GAACCA30AG15AG17AG4AG12GA2AG4AG5GA8AGAT6AGAGAG2TC19GA2CT11CT10AG4AG1GT41AG14AC2TC1AG27AGAG1AG10AG15TCGC2AGAG9GA1AG12GA7AG1AG11TC11GA44AG13TA9AG3CTAG12GT4GA15CA10AGAG1AGGC4TC2GA21AG16AG7AGGA13CT2AGAG8TC14GA11AG15TA10TC10AGAGAG3GA14GA1TC1AG11AG7AGAG7AG9TG16AG3CT3AG3AGAG8CT2CT22AG12AG12AG2AG23AGAG9TC1AGAG2TG1AC5CT1AG8AG11GA1CT3AG20AC3AC18AG5AG8CA3CT7CT5AG5AG2GACT28GA9AGAGGA21AC21GA12AG15AG4AG5CT7AGAG2GA5CA6AG5AGAG1AG10GA3AG5CT11AG6AG19AGAG6AT2AG8AT2CA3AG1AG16AGAG3AG11AG10AG6AG47AGAG6TC6AG1GA20TA8GA22AG4AG7AG21AG19GT11GA3AG4AG11CT3AC8CT5AG28AT9CA11AG2AGAC3AG2GT1AG11AG2AG3AGAGAG9AG6AG1TA25AG7AG7AG5TA18AG4AG4AG10AG66AGAG2AG10AG30AC5GA43AG11AG10GA9AG18TC15AGAG21CT35AG7AG7AGAG13AG31AG28TC11AG5AGAG6CT1AG1AGAG2AG1GTCT9CT2TC2CT4CG1AC28TC11AG1GA9AG16AGAG19AG12AG2CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT39AG3AG23AG19GA26AT1AC12AG7AG21AG9AGAG6TC9AG18AG10GAAT17CT5AGCACTAT5AC2ATAGAG1CT2AG1AG3TC17AGAGAG9AG2AG4AG27AC10TC12AGAG5AGCA15AG2GATC2TGGA2AG2AG12AG13AC14AG23GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT11AG2AG17TA2ACACGA3TG26GACT20AG1AT8GAGT4AG6AG27TC2AGAT5AG5AC3GT1AG28CT3-G-G-A-G3GT5GC1ACG-A-A-4CGAGGACG1C-1TG1TGAG2AG2AG2AGAG5GC9AGAG22GA1GA5TA4AGAG16AG11AGAG1GAAG2TA4ACTC11CT32AG13AG30TC8TA7AT4AGAT21TC4AG7AG10CA22AG6AG22CT6GA16CG6TG11AG2AG3AG5GAT-A-G-G-1AT1TC3ATCAAGAT1TG2TG1AGTGCGTACG5A-A-C-4AGCG1AGT-A-C-4AG1AG3AT1T-G-1CA20CG4GAAGGC7AG3AG4GAAG12CT17GA1CA2GA11AT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG3AG7AG8GA5ATGA2GA3TC7AG5AG9ACGA27AG7AG8GA21AG1TC2CT9AG2AG2AG5CA9ATAC8AG6AG6ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C2AGAG7AT2TGAT1GA3CT1AG2CA1G-A-T-5AG1GA4AG20CT3-A3ACCA1GA2TG3G-1GA9GACAAC1AG4TC1GAAGAC7AGGA3AC5AG4AT26AC3AG3AG4ACTC8AT19AG3AG18CTAT6GA18A-A-2G-7AT3AT1CG1-G2-C-T-G2CGAG1-T-C2CA5AC1AG2-G-G2TG-T-G-A-C-A-C-A5AC5GA20CA4GT7GA5AG22TC6AGAGGAACTA6GA2CT17AG2AGAC14AG2AG3CAAT1CGTC2TC1GA1AG1AGGTACAC4CT10AG3AG1AG2AG6AG8AG21CT17GA6AGAG19CA1AG4AG3AG21AG1AGAG3C-G-T-8AT7CTAG7AGAG2AG16AG8GC3CA10AG5AG29AG12CT6AG22AC18AGAG8AG15GA5TG4AG12CA1AG15AGAG6AGAG8AG20AG9AG4AG6AG3CT9T-A-1AT1TG1CA2TGCA1ATAT1-G-A2AC3TC5AG4CG3AG13CA1AC10AGGCAT5TC2ATAC4CA2AG12TA3AG2GAAG11AC10AG3CT5CA4AG4AG5AG5AG5GATC8AT5AG1AG10AT25AG3AG6AG4AG11TC25AG5CT11AG2GT7TA12AG2AGAG4AC12AG3TCAC13AG1AG12GA8GTATAC9CATCAG3TC3AGCG4CT4AGAG5CT4AGAG11TC13AG3AG1AG18GACATC2AG2CT4CG2AC4AG4AG2AG1AGAG2AGAG2GAAGTC6GA2CT1AG2AG2GA6GA7AGAG1TG37AG3TC3TC2CA11AGAG1AG7AGAG12AGGT4AGAG1AGTC1AT1CT6TA3TG14AGGA8AG5AG4AG1GACT5AT4AG2AGAG9AG10TA2AG2GACT1AG3AG4GA6AGAG8A-G-A-A-A-3T-T-A-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-A-G-A-A-A-G-A-2AG17CA2AG3AGAG17TC1AG6TC2AG23TG2AG4TC16AG18AG2AG2AG2AG2CT10GC6AG26AG6TG2AG47TC1GC5GA11AT9TC5GA1TC14AC17AG14AG12AT24TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG11AG7AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,598,8845,9441,1,598,0.0,659,88.629,530,plus,14TC1GC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA5AT24TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG11AG1GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,201,104,304,9486,9686,2.55e-74,278,98.010,197,plus,19GC21CT24GA78TC55 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,111,1,111,627,736,2.52e-31,135,92.793,103,plus,40TGAGGA8AG2AC45C-1AC3TG4 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,9077,150,9207,636,9626,0.0,9759,87.937,7982,plus,31AG41-A23CG21GA3TA38TG20CG3AG8AC3AG10TCAGCGCT9AGAG16GA17AG30CT2CT14GATA13CT2GA5TA2AG15GT50GATC9CT2AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC11AG8AGCG1ACTA24AG10AG28AG18CT8AG41AG1AG20GA11AG11TG2GA10AG7TG19CG22AG9AG20CT24AG3AG7CA28CT20AGAG1GACT4CT24GATC7TC14AG7AG10AG3TC11AG16AGGA2TC8GT8TG10AG18AG14TC14CT14AG8AG6TC32AG13CT41GT5CTTA7AGGA4AGGA12AG14AT28AG1AG10AG17AG6AG7AGAG6AG8AG23AG6C-1G-A-C-T-A-A-G-A-C-13AG7TC9CT15AG9CT26GA4CA14TC2AG2AT4GA5GA4TC15AC3AT4CA1AG15GA10AG20AC1ACAG1ACTA7AG5AG11AG47AG1AG11AG2AG16AGAGAGAG5AG2AG29GA3CT9TC30AG10GA2AT12AG16CT3CA2AG22CT2TC8AG21TC7AG3AG6GA36GA6AG11GA4AG2AG9AGAG7AT8AG7GA8TC44AG1AG16CA19AT10AGAG9CT2AG49AG5AG23TC5CTAG10AG23CT15GA6AGAGGA3AG25AG3AG4AG55GAGC31AG15AG18AG6CT14AG2AG17AG5AG5CT14GA12AG10TC4AG3AGAG24AG16CGAT9CA10AG27AGAG1AG2GA7AG6CT5CT2TC4AG11AG46GA72CTAG33GA11AG2ACGA2AG5AG44AGGA13CT3AG26GA24GA2CATC4GACG12AGAG22AG2TC8AG7AG1AG3TCGA9AG18AG11AGAG2AG5CT17AG3CT3AG28AG10TC9AG2AGAG9TC2AGAG11AG9AGGA8GTGA1CT3AG10GA6TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG6AG1TC2CT7AGAG2CA12AG6AG31AGAC1AG7AG1GA10CT5AG10AG8AT8AG16AG16AG52GA6TC11CG1TC6AG53AG5AG7AG21AG4CT18GC28CT3AC1CT19AG11TC9AT21AG1CTAG4AG4AGAG10AG2AG3AG1AGGA15AG1TA14TC9AG8AG13TAAG27AG48TC2TC51AG35CT14TA18AG22GA1AT71TC33CA4AG6AG58AG3CA21CT2AG5AGAG7CAAG1AG3AG1GT4CT19AC1AC6AG2CT22TC3AG3AT2AT13AC8AGAG32AG2CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC5AG8TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG7AG5AGGA2AG16CTCT12TC4CT2TC12AG6AG9GA5ACAG3TC22AG17CATC9AG3AG14AG4TAGA10AC16CAGA24CT4CT7AGGC29AG19TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT8CT2GC13GACT24TC6TA1AC10AG6TA11GA18AG5AC3GT33CA-G3GA1CACT1ATGC2GC1AC2AG1C-C-1CG1CGTA1-G-G-G-G9AG4TC1TA2TC5AGAG3AGGT1AG5AC8CT1-C-A-G1CA2CA4AG16AGAGAG8AG1AG3AG8TC38GT6AGATGA10AG3AC2CA25GA6GA7CT3AG1AT14CAAT10AG18GA28AG24GA3CT18CG6TG9A-A-2TG2AGTACA1AG1C-T-1GAC-C-4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5AGT-G-A-A-A-2AG8AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT9AG2GA2GA11GA1AT4G-T-A-A-A-A-A-T-A-4GCGA2A-A-A-6AT3TC2AG24AG21AG18TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT4CT18AG2AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT2GC2CT2AGCA1TA4AG2GA4AG8GA4AG11-G2AC2GA2TGA-4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA6CATG13AGAG8GA2AT2GA1TC3TC12AG3AG19AT7GA16AG1ATAT11AG1A-A-T-8TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGATAG1GA35GACT2GATC10AG1GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA3AG5AG9AG8AG7AG22CA6AG8AG2AG11CA1TG20AG1AGGA12AG1AGAG2CA1TA1AG6CG6AG7AGAG19AG8GC3GA10AG41AG14AG40AGAG22AG1GA8TG1AG14AG14AGAG6AGAGAG29AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AGAG2AC1AG7GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA1AG11AGAG4AG4GA4TA3CA1GT1AG3AG1AG10AT10AG6AG8AG2AG17AG2AG4GT13AG9AG5CT8GA2AG2GT7TA11AC3AG18AG4AC6AGGA4AG2AG3AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC13AG12AG4CTGAGA4AG5AG8AG8AGAGAG2AGAG5AC2GC2GA4AG2AG9GA7AG10AC13AT14CTAG7AC15AG9AGAGAG11TG5AG3GCCT1TG11TG11CG1CA16AG4AG1GACT13AG3AGAG5TG5GA3GTCATGCTAGAT1GACT1AG8GA1CTAG3AG3GA1AG3AG9A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-9AG3CA2AG3AGAG20AG3GA10CA1TC31AC1GTTG6CG12CG2AG2A-A-A-2AG5AGAG12GC18GA15AGGC4CG5AC22AG11TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC3AG3AG5TA18TG8AGGA12GA1GATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG1AG5GT3GCACAGCG1CG8AG2GACG35AG1AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,543,8665,9207,1,542,1.27e-164,578,87.293,474,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC3AG3AG5TA18TG5TG2AGGT7GA4GATCGATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG7GT3GCACAGCG1CG8AG2GACG37AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,151,1,150,781,631,2.96e-50,198,96.026,145,minus,22AT3CT21GC23-T41TC12AG23 +MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9718,9035,155,9136,649,9626,0.0,10641,91.489,8266,plus,18TGAGGA85-A-A-A49TA24ACAG27AG10GA57CT2CT5TG9AT4GA2AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC13ACGATC1CG2GACT20GT12CA31GA23GA20CT2TC8GA2AG23GA95GA42GA13AG50AG10CG11GA27CT32GA30TC9AG49GATCCT17AT2GA5TG26AG14AG41AG2AT35GA2GA14AG42AGAC2TC41CT35TC50GA68CA18CT38GA13TC5ATGA6GA7TC18GA1GA9GC11GA9AGAG40AG41CT97CTTC68CA6TC19TC20TC8AG12CA88AG8AG8GA95GA11AG41CT20GA6AG35AG11AG43TC85TC24GA38CT53AG11CTTC6AG7TC1GT11TC20CT8GT59CA5TC27CT7AG26TCGC13GA2AG19AGGA3GA7GA11GA4AC39GA2AG59GATA22GA50GA10CT7AG64GA14CT4GA9AG8GA2AG11TA2CA11AG23CT14CT32AG5AG8TC2TA14TC23TC37GACT14GA6TA31AGCT1GA10GA6AT11AG39CT7AC18ACGAGA12AT39GA6CT2TG77CA8GA23GT2GA16AG66TC11CT8GA10CT37TC88GA8AG11CT2CT2CT17GA8GA3GA10AT8AC1CG10AG12AG18AG2GA13GT3CA71AG35CA93CA19GA46AG4GA25AG2TC2TC141CA32CTAG5AGAG6CTCAAG29AGTC35GA74AG17CG3GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG59AC22CT5AG10GAAT25CTAT5TC8GA2AG33AG14TA31TC17CT1AG16AG1CT43TC34GA3CG10AT14AG2CT34GC46CG3CA3AGGA18TCATCT5CT9GA7TC11TC1CTTA2TCACTA3TG2AG23GACT4TA17GT8CA12AG11AG6GA1GA6TC15AC7TA2GA32TACAAT1GT-C2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC12AG13AG4AG2GA4CACA1GA1GT35GAAG7AC37AGGA8CT55AG5AT1AG1GT6AG6GA16GA3AG10TA38TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CG-C-G-G-G-A-G-A-A-T-G-A2CA1TG1GA-G-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG2AC1AG6GTCAGT3CT11AC5TA2GA2GCAC7GA1AT2G-A-A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT34TA21AG8GA13AC5GA5ACGA26GA19AG55AG1GA10AT4AT4AG6AG6AC13TC4GCGAAC1GT1CTAG2CG5TATACT4TC27TA2ACACAG3-C-C-A-G-A-G19TGATCT4CT4GA1T-A-T-7GA1CT2AG2GA21GA1-A-G-C3TA28CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT16GA8AG26CT5TC9TA2TCCA15CT3ATCT3AT1A-T-G-5GT1TG3TAGC-T1CA1-G-G3TA3GA1TC3CG1-A-G3-G2GATC1ACTA5AC4AC25CA8GAGA44AGCA3AT20GC1TA14GT2GT2GTGATGGC1TATC5AGAT1TC4CT3TC15AG6AG3TC37GA16AG19AG14AG5GA11AG3CA1GA6AT25CA20GC5AGGA9AT11GA1GT19AG42TC25TC18GA23CA16AG2AGCA35AG14CGGC7GA1T-G-G-G-C-A-3CT3ATAC3AG2TAGC1CG6GAGA1AC3TC18AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG28CA34GA5TA2CA1AT18AT69AG15CT11AG10TA7GA1TC9GC18TCAC7GA17AG2GA7GAGT17TC3AG20AG35CA17GA1TCCG62GA5CT29CT11CTAG7TC4TC9AG12AG1AT6AG2TG5AG2AGTC1GT8TA3TG12GA17AG6GACT38AGGT1GA8ACAC1GA1AT2GA14A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-G-G-G-A-22GA17AC14TC8CA1TC8GC14TC7AC31G-A-T-19GC21CA8TC2AG6CG7GT39GA2TC9AG3GA41TC36AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT23AG7CT3TA21CA12AG11ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G21CT22GC18-T56TG45 +MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9718,542,8609,9136,1,542,1.63e-174,610,89.852,487,plus,11GA2TC8ACAG3GA41TC10GA36CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT6GA16AG7CT3TA21CA24ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG21CT22GC18-T56TG45 +MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9718,9143,312,9387,577,9685,0.0,10915,92.136,8424,plus,25-G-A-C3-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23C-TA1TA2TG1AC2A-2GA1T-C-C-C-TG1TG3TGCGTGCATA1GC3TA2CA2C-C-G-AT4GC1T-A-2TGACGAAG5AG18AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25 +MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9718,654,8787,9414,1,645,0.0,705,88.532,579,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,7800,1191,8938,1230,8996,0.0,8979,90.526,7061,plus,2CG17-G-A-C7AG5GA33AGGA4CT15CT5TC3AGTA6TC5ACACAG15CT4GAAG13AG7CA13GA13GC3GA24CA19GA14CT20AG13ACGA27GA8CT14CA1GA7GA10TC1CT3GA2TG34TA7AGGA37AG27TAGA11AG65CTCTAG9AG24GA3GA47AC4GT17CT11CT16GA28AG76GA8GA30AG55GA11GA11TC17GA8GA11AG2AG20AG35AC14TC5GA20CG3GATC79GTCG15TC14GA2GA14GA5TC18CT1AG3AG13GA3TA4AG8GA29AG11GA14CT2GA2GA23CT8GT32GA6AGCTAG5AG41AG8AG20TCGC15GA21AG9TG27GA46CA1GA32CT12TA4AG8AG8GA5TA5GA11AG14GA11GA11AG1AG4AG29CG4TA41AG11TC1GA63CT17TC17AG20GA5CG20AC8CA8AG2CT2TC5TG26TG3GA4GA12AG5CT22GA21TC8CT10AG4CT9CT6TA10GA6AT7TCCA19GA12TA6AG22AC10AG9AG7GA11AG57TC4CTTC28AG5GA50CTAG41TC16AG8AG44GA32GA14TA44TC3AC31CA26CT5TC2CT3GA7AG2CT14AG23TC38GA35GA5AG14GA23CT33AG31GA6TA10AG95CT2CG35CT5AC41CT36GA20TAGA10CT8GA9CT9GA5TC1GA2AG5GT1TG4AG10GC4TC1CT1AC25CT11GA2TG5AC2AGAGAT5CAAG32CA11CT2GA20AG3AGAGGA2CA5TC14TA1AGACGC16CT44AT6GT9GT48CT15TC2GA8GATG2AC1TC4AG4CT18CT4CG3GA5GA25GA11GA5GA2AG5TC9GA27GAAT14TC2CT7TC6TC2GCAG1CA5AG5CTGA9CA9TC6AG10AG15TC8AC7CT11AG10AG20TC2GT2GA1GA5AG20CT5CA4CA12CT20TG7CA2AC15GA2CT5AT28GC46CG7AGAGGA1AC2AC2GA8AGAC1CT5CT14AGCT6CA5AC5GA6GTGT2CG20GC1AGCG24TC6CA30AG9TC2AGAT4AT9GA40CT8GA2AG8GT5AG1GT7GCAT10AG2GA8CTTA11AGCA36AG5GA53GA20GA17GA21TG6GT13GA7TYGACTAG4AC11TC3GA38CTTC22CT5TC7TC3GACA11GT1CG1AGCA7-C-T-A-A-T-A-C-C-A-A-T-A-G-T-A-C-C-G-C-C-G-A-G7-A1AGTC2CA7CA1AG28AGAC4CGAG6GT1AG33GA17A-A-G-6G-A-T-2T-A-G-C-T-T-T-A-A-T-A-A-T-A-A-33TC5AC5TC38CT3AG12AT3AG7GA6CTAG2GA3CAAG11AC2GA7CA10TA2AG21GA9GA15TC17AG2CG1GA18CG7CTTA1GA7TC24GAAGCACA6AG7CT8GA2CT2TC3AT7AG5TA3CAAC1GACTAG10AG4ATTA4GA30AG9CT9-A3G-2GA1GA6GA1TC19CA7CA11GAGAGC5AT11CT2TGCA4GC25CTAG10AT18TC1AT13CA24AGTC1AC2GATAAGCGTA3-G2TGTAGT1AG1TG2TG1CA2GAT-17TC1AG5GAGA21AG22TC9CG1TA10AG3TCTA1AC35TA6GC1GA1GA2AG2GC1-A-A-C-G-A-G-A-C-T4CT12CA6GA26TC21GA16CG50AG1AG4CT1C-T-G-27AG29AG22GA1AT21GA19AG48TC2AG18CT1GA18CA46TC35CT12AG4AG6GA17GC1GA7AG8GATC9CGAGAC11TC17GA1GA3GA16AT3AT3TC2GCCA1CT7GA4ACCA2CT7GA7AGGATC8AC41CA2AGAG4GT9GA22AG5AG14TC8GA2AG10GA1TC30AG15CA22GC4AGCG9AGAGCACT9CG2CA9AT3CT3AC3GA47CT1GA24AG13AGTC7CT9GA9AG20AG2AT57AG11GT9CT2GA13CA8GATC4CA1AC5AG5AG5AG19GA15GTTG4T-2T-T-G-G-A-23AG5-A-A-C-T-A-A-G-C-C5GA12AT2GA10TC4CA10CA22AG7CG7TC7CA30-G-G-G12TC5TC1GAGA5AG33TC1GA42AC1GA2AT8GA35CT29CT11AG11GA2TC26AG9CG5AC4GCCA9CA5CA2GA3AG2GA21TA3AG15TA10GA6AGCT20AC4AG5TG7GTAG3ACAG4CATA18AG11CT1AG2TC3AC30G-24-G37CT5CT-T33TA22GA2GA45AC26 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,1137,58,1194,1219,86,0.0,1395,92.964,1057,minus,2TC11TA2CT83TC41AC8AG17GA2TC48TC17AGCT3AG8TC28CT9AG2GA2AT5TC19TG48AG23TC13CT66TC8TG23AG16TA23CA15AG17AG50CT26GC1GTGA17GA8GA9TC1AG3CT3CT1CTCT18TC2CTAT4GA11CT14AC4GACA3CT12GT2TC7CT9TC12CT4CT16TC4CT8CT5TC2GA3GCAT3CT41TC2CT49GT9CT17TC7TG12TC6TCGTGA7TG57GTTC4A-C-T-25 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,57,1,57,4,60,1.43e-11,69.7,91.228,52,plus,14TAAGGA8AG2TC28 -MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9719,9071,480,9481,576,9625,0.0,10861,92.239,8367,plus,26-G-A-C-C-C-T-T2-A-G-T-C-A-G-T-G-T-G-G-A15C-3A-1ACTC2G-G-C-TA1GA1TGAG2TCAT2GA1TG1CGTACA2TGAG2TA17GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9719,542,8949,9481,1,540,8.48e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9719,9035,70,9055,648,9621,0.0,10441,90.747,8199,plus,19AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA69GATC9CT2AG12AG1TGGA20CT6CAAG11AG20GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG13CA23GAAG28AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC8TC20GA2TC8GT8TG59CT14AG8AG6TC31GA2GA11CT47CTTA8GACT3AGGA21AG2GA2AT30AG4TC50GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA21GA10AG20AC1ACAG1ACTA6GAAG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA27CA8GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTCG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA20CA7CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA30CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC1CA26CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA25AGGACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT24GA23CT15TC2AG21GA2GT9CT5CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA20CT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CTCA7GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2ACAC5CT11GC14CT24TC6TA1AC17TA11GA24AC3GT27AG5CA5CACA-T1GTGC2GC1AC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT4AGAT14CAAT29GA53GA3CT18CG6TG9A-G-2TG3-A-A-T-G-A2AC6TC3TAAG2AG1-A-G-C-G-G-G-A-G-A-A-T-G4CT3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT4GA7GA2GA2TC8GA1AT4G-T-G-G-A-A-A-T-A-4GCGA2A-A-A-4GA1AT3TC2AG24AG12AG27TA30GA4GAATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC1CT5AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG19TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA11ACA-6TC2TGAC7AG4AC6-G-A-A1GT12GA7TG23GA2AT2GA1TC3TC36AT7GA18-T-T-T3GA5-T-G2TGAT1TC2G-2TG3-C-A-A-A-T-A-A-C6TGCG2AG1AG4TA5AC30TA8GA9GA12TC9CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CTAC5GA59CA18AG11CA1TG20AG2GA18CA1TA8CG44GC3GA52AG14AG66GA8CG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8GT1CG7AC1AGGA6GA11GAAG1ATCT4TC1TCATAC10CGTA3AG2GA5AG6CA13CA7CA9GA16GA7GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11CG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA10TA5GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG3TG5AG5GT3GCACAGCG1CG8AG2GACG16TC18AG22AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 -MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9719,537,8519,9055,1,536,6.00e-175,612,89.944,483,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG3TG11GT3GCACAGCG1CG8AG2GACG16TC41AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,9023,565,9537,623,9625,0.0,10895,92.563,8352,plus,26A-C-T-C-TG4T-13TGAG20GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,542,9005,9537,1,540,6.18e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,28,370,397,622,649,0.002,42.5,100.000,28,plus,28 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,8984,200,9165,768,9676,0.0,10431,90.895,8166,plus,51CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC9CT2AG4CA7AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG2TA35AG28AG18CT73GA11AG10CATG2GA18TG19CG23GA29CT36CA25TA2CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA24GA2AT30AG10AG44GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG65CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC63CA19AT21CT52AG29TC5CTAG10AG23CT15GA7AGGA94GAGC55TC10AG6CT17AG18GA10CT38TC51CGAT9CA15AG25AG2GA14CT2AG2CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG47TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA2TA3CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGGC9AG12CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC110TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA19CTCT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2GA2CACA-T1GTGC2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-2TG2AGT-C-T-A-3CGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11GA1AT1G-T-A-G-T-G-G-A-A-7GCGA2A-A-A-4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA7GA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT14A-T-G-7CAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG1AG3CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC1CT8CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT12CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1AT2AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,592,8574,9165,1,591,0.0,690,90.878,538,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1AT2AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,129,1,128,778,650,1.18e-41,169,96.124,124,minus,19AT3CT21GC23-T41TC17 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,72,130,201,623,694,1.90e-21,102,98.611,71,plus,44AG27 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,48,9167,9214,463,510,5.46e-12,71.1,100.000,48,plus,48 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,48,9167,9214,9548,9595,5.46e-12,71.1,100.000,48,plus,48 -MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9719,9068,648,9663,640,9643,0.0,10103,89.314,8099,plus,27TGAGGA62AG22-A-A-A13AG20AGAG13TA24ACAG27AG10GA57CT2CT5TG9AT7AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC8AC4ACGATC1CG2GACT20GT12CA31GA19AG3GA20CT2TC8GA2AG23GA95GA10AGAG30GA75CG2AG8GA27CT20AG11GA30TC9AG49GATCCT17AT8TG10AG15AG2AG11AG32AGAG7AG2AT35GA17AG42AGAC2TC41CT28AG6TC100AG18CA3AG9AG4CT52TC1AG3ATGA6GA7TC18GA1GA5AG3GC11GA9AGAG40AG5GA35CT17AG16AG17AGAG11CT30ACCTTC68CA6TC14AG4TC20TC8AG12CA7AG8AG3AG67AG8AG3AGAGAG2GA12AG61AG19AGGA11AG16AGAG12AG10CT6AG13GA6AG10AG5AG18AG11AG9AG33TC3AG9AG35AG4AG30TC24GA32AG5CT9AG17AG25AG11CTTC6AG2AG1AG2TC1GT11TC20CT8GT5AGAG52CA5TC27CT4AGAG1AG11AG14TCGC3AG9GA2AG19AG4GA7GA11GA4AC38AG3AG22AG36GATA11AG10GA50GA10CT3AG3AG64GA5AG8CT4GA9AG8GA2AG7AGAG2TA2CA1AG9AG16AG6CT4AGAG8CT25AG6AG5AG5GA2TC2TA14TC12AG10TC1AGAG12AG21GACT14GA6TA31AGCT1GA10GA6AT11AG39CT2AG4AC18AC1GA12AT46CT2TG4AG16AG5AG2AG32AG13CA12AG19AT2GA3AG12AG5AGAG45AG13TC11CT9AGAG8CT4AG20AG11TC34AG21AG31GA8AG11CT2CT2CT17GA1AG6GA3GA10AT8AC1CG10AG12AG11AG2AG3AGAGAGGA13GT3CA25AG45AG35CA93CA19GA46AG4GA25AG2TC2TC79AG61CA32CTAG5AGAG6CTCAAGAG28AGTC35GA34AG33AG5AG19AG1GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG51AG7AC22CT5AG10GAAT25CTAT5TC11AG22AG10AG7AG1GA4TA31TC2-T10AG4CT1AG16AG1CT24AG18TC34GA3CG10AT14AG2CT25CT8GC46CG3CA3AGGA18TCATCT5CT9GA7TC6TC4TC2TA2TCACTA3TG2AG23GACT4TA15AG1GT8CA12AG11AG6GA1GA6TC15AC7TA1AGGA32TACAAT1GT-C2GC1GC2AG1CGAGGACG2TGTG-G-G2AG5AG5TC10AG1AG13AG4AG2GA4CACA1GA1GT19AGAG14GAAG7AC37AGGA8CT11AG43AG5AT1AG1AT6AG6GA16GA3AG10TA28AG9TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CGTCTGCGTG1-G-A2AGCA2CA1TG-G2-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG1AGAC1AG6GTCAGT3CT11AC5TA2GA2GCAC7G-A-2AT2A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT15AG18TA13AG7AG8GA13AC5GA5AC27GA12AG6AG55AG1GA10AT4AT4AG6AG6AC13TC4ACGAAC1GT1CTAG2CGGA4TATACT4TC27TA2ACACAG3-C-C-A-G-A-G1AG7AG9TGAT5CT4GA1T-A-T-4AG2GA1CT2AG2GA21GA1-A-G-C3TA4GA23CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT5AGAG9GA8AG18AGAG1AG4CT5TC9TA2TCCA15CT1AG1ATCT3AT1A-T-G-5GTAGTG3TAGC-T1CA1-G-G3TA3GA1TC3CG1GAAGAGTA3AG1TC-A-C-A5AC4AC25CA8GA5AG29AG9AGCA3AT19AGGC1TA12AG1GTAG1GT3-A1AC3TA1-T-G-A-G-T-C-C-G3CT3TC9AG3AG1AG6AG3TC12AG24GA13AG2AG19AG20GA11AGAG2CA8AT8AGAG6AG8CAAG10AG8GC2GA2AGGA9AT11GA1GT1CA17AG20AG21TC18AGAG5TC18GA10AG12CA16AG2AGCA4AG9AG20AG9AG4CGGC6AGGA3G-G-C-4C-A-A-A-A-2TCA-C-A-A-A-A-G-3AG2TAGC1CG4AG1GA2AC3TC5AG3AG4AG3AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG3AG24CA11AG11AG5AG4GA5TA2CA1AT18AT25AG3AG39AG9AG5CT11AG10TA7GA7AG3GC14AG11AGGA4AG12AG2GA7GAGT17TC3AG10AG9AG8AG26CA17GA1TCCG1AG15AGAG6AG1AG3AGAG16AG2AG9GA5CT1AG27CT11CTAG7TC4TC9AGAG9AG1AG1AT6AG2TG5AG2AGTC1AT8TA3TG12GA17AG4AG1GACT13AG24AGAT1GA2AGAG2AG1ACAC1GA1AT2GA1AGAG8AG2A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-A-A-G-A-23AG3AGAG11AC7AG6TC8CA1TC7AGGC14TC7AC24AG6G-A-T-5AG13GC7TG13CA8TC2AG6CG7GT39GA2TC9AG3GA41TC10GA22AG2AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT4AG18AG7CT3TA6AG14CA12AG11ACAT11TA2AT3AGGA11AC6TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 -MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9719,558,9120,9663,1,558,4.74e-171,599,87.993,491,plus,11GA2TC8ACAG3GA41TC10GA22AG13CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT4AG1GA16AG7CT3TA6AG14CA24ACAT11TA2AT3AGGA11AC6TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 -MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9719,9071,541,9544,577,9625,0.0,10835,92.129,8357,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG1AC2A-2GA1TG1CGCATA1CGTGCGCA2TC1TACG2CG10GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9719,542,9012,9544,1,540,3.24e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,8890,661,9500,755,9626,0.0,10711,92.463,8220,plus,3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG81A-T-G-G-G-21AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC13GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,544,8966,9500,1,541,1.71e-174,610,89.890,489,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,99,9492,9589,4443,4345,9.70e-29,126,94.949,94,minus,4GT7GA36AG20CT9-A18 -MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9719,9088,581,9617,577,9627,0.0,10868,92.221,8381,plus,26-A1TC2ATGTCT3GCGACGGTCGCTCG3C-A-G-21G-G-A-C-T-C-T-G-G-T-3T-2AG2T-3C-A-C-TG3TG1T-A-1CA1GATG2CAGACA1GC7A-8GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9719,544,9083,9617,1,542,1.19e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9719,9069,479,9485,577,9625,0.0,10895,92.370,8377,plus,25A-C-TG1ACACTCCT1CT3-T5CT1C-C-C-3CA1G-G-G-AT40TGAG20GA29AG20-A-C-T-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2GT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA24GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA29TC5TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTTA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA13GT4AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 -MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9719,542,8953,9485,1,540,6.15e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 -MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9719,9072,349,9353,577,9625,0.0,10877,92.284,8372,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG2TCAT2G-1TACG1CGTACA1AGAGTGCA19GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9719,542,8821,9353,1,540,8.37e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,8943,204,9098,747,9608,0.0,10376,90.876,8127,plus,2GT2TG1AC15TC48CG2CA8CTACAG27AG4GA4CAGA45CA8CT2CT29CT1AG7AC7AG2CA6GT50GATC12AG5GA8TGGA4GA2TC5AG14AG32GAAG14G-C-C-12AC3AG2GACT2AG17CT14GC5AG26CT5CTCT20AG13AT14AG18CT7GA92GA32GT5AG3GA16AG2GA55CG10CA10CTGA16CT18TC5CT16GA12GATC7TC58GA11TC17AG6GAGA51CT22GCAG38GA9AG13GA8AT16CT4GAGA1GT2CGAC1GA27AG14CT9CT23TC1TC29GA42CT2CT29AG12CT13GA8CT35G-G-A-G-A-G-C-C-T-C-A-G-G-C-C-A-A-C-A-G-C-C-C-C-A-C-C-A-G-T-14TC5AT7GA2GA1CT3TCTC12AG4GT9GAAC3CA3CT3GA9AGAG19ACGC1AC24AC19CT33GACGGT75GCCT9TC14AT2TA32TC17AG38TC8AG14GA27AG58AG14AG14AT27AG31GA80TC5AG18AG25CA26AC32CT81TA16AC29AC23CT56AG2AG3GCGA11AG6GATC28GA43GA19AGAT9GA5AC1TG33AG8CT23AG10AGAG20GA12TC58AG39AT7AC23AG11GA56GA53GA6TA1TC44AG25TC12CG40GA3TC6CT4AG66TG4TC30AG5GA1CT14GA13AC9CA5AG5AT15CTTA6AT11AG10CT9GA45AC21GA34AG4CT3AG16TC20GA21AG4GA2TC9TC21GA9AT2GA7GA36CT68TC12AG25GA14CT12AG82CT3AC1CT41AT21AG2AG1CT2AG4AG21GAGA16TA17GA11GA32AT11CA50TC59TC45TA13CT27GA28TC20GA11GA41AG17CA60CA30AGAG4AG3AG27GA3AC9AG37GAAGGA6GA17TC4GTCA4GA5GA38AG3GAGA9AC5CA2GA6AG1CA24CT10TC11AC12CA1TG3AT10TC1GT54GA22GT1GA37TG5AG53TC28AG2AG6CA1GT11GA12CACTAT5TC3AG11TC34GA20GT20TC2-T17AG16AG3TCCT1CG22TG13AGCA35GA10AC25CT21CT1CAGC5GC35GA1AC5GA2TG3TA1AC1AGGAGA1CA5GA9ACCT31TC1TCTA1TC2TA1A-G-A-1GCTC13AGCT16GAGT22AT8CA1TC40AG1AT2CA8AC3GT33G-G-G-G-G-A-T-C-3A-4TA1GA5GA14-G-G-T1CG1CG1ATTG1CGTG18AG2AG5TCAT3AG10CA34AG5AG8AC11CT90AG1GA5AGAG46TA2AG5AT5CT3GA4CT52CGCT5TG6AG5A-C-C-A-T-T-G-A-G-C-C-A-2CG4CA6ATGA6TG4-A-G-C5-A-A-T1TA2GAAT2GA9AG2GA1CA16GA3CG7CA6AG4AGGT1AC14CT1CT15GA2GA2GC3CT2GA1GA1ATAG3AC2AC5TA2GA5TC9TC7ATGC26AC5AG47GA6GA4AG1AC16ACAC5ACCA10TC82GA9CT7TA1AG6AG4GA22AC1AT6TA33-A-A-AGA4-T-C-C4AC2TG1TG2CG16TGAT1GA3CT4G-A-T-1TA7GA4AG3AC21AG2AC1GA1TA7CA9CA3GA1GA4AGAC6CAAG11-G-A-A1GT3GACA7GAAT6AG1CA29TC40AT4GAGC4AG3TACA1TA1GT1-CAT2CG1ATCT2CT1AGAT3-T-G1TATG4T-G-3TG1CG1A-6GA2AC1AG1TA3-A-G-T-G-A-C2CA4TCAC8TC29AGGA1GA29TCCA19GA14AG23GT1CA2A-C-1GCGA3GAGT2A-C-A-G-1ATACTC4CT15GA3AG6AG30CT9GA5AG65AGCGCA9AT14CT4GA26AC3CA46AG12CT10GT11GA32AC2AG15GA16GA7GAAG26CT17CT9AG14AGTC14GA1AT5AG1TAAC1CG6GA1CTAC1TCTATC3TC6CG7TC1CG20AG1ATAT4TC2CTACAC3CA4GA3GT4GA8GA43AG16GA5TA4CT11CT6AT8TA1AG14AGAG20AG37CT22GA1TC5GATC29CTCA36GAATCTAC15TC4AG12TA7AC94AC18GC4GA2AG41AC16TC22AG8TG3CT4AG2AGTC9-T-A-T-T-C-G-C-C-A-C-A-T-A-C-C-T-A-G-A18AG5CA33CAAG4AGAT2GT2AG4GC2GAAC16GACG2AG1AG5GC11GA12TC9TC7GA31AG3AC15TC43AC9GA5GA11CT7GC4TG44TC5TC1TC7AG9CT15GA5AC24GA24AGAGCT5TACT6TAGC14TA18TG9GA1GA5AG19AC16AG19GT3AC1CG8GA6AGTA5AG30AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT22AG1G-G-G-A-G-G-C-G-T-G-A-C-11-T22GC21CT3TC5GT47GA6GA15 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,535,8565,9098,1,523,1.26e-164,578,88.037,471,plus,8TC5TC1TC6ACAG9CT15GA5AC24GA24AG1CT5TACT6TAGC14TA18TG5TG3GT1GA11TC13AC16AG13GA5GT3AC1CG8GA6AGTA5AG28GA1AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT12G-G-G-A-G-G-C-G-T-G-A-C-10AG12-T22GC21CT3TC5GT47GA6GA15 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,161,1,161,4772,4612,1.47e-54,212,95.652,154,minus,48GT11TA32CT11CT17AT16CTCT19 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,51,160,210,649,699,2.00e-12,72.5,98.039,50,plus,18AG32 -MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9719,9115,49,9137,649,9681,0.0,9873,88.195,8039,plus,18AG41-A23CG9AG11GA3TA11AG20AG26CG12AC3AG10TCAGCGCT11AG15GA48CT2CT12AG1GATA13CT2GA5TA2AG15GT44AG5GATC12AG7AG4AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC2AG8AG8AGCG27AG10AG28AG18CT50AG1AGAG19GA11AG11TG13AGAG6TG19CG22AGGA8AGAG19CT24AG3AG36CT10AG10AG1GA16AG13GATC7TC14AG18AGGA2TC28AGGA2TC2AG5GT8TG10AG18AG14TC14CT14AGAG7AG6TC46CT41GT5CTTA8GA4AGGA10AT1AG14AT30AG10AG17AG6AG7AG13AG26AG20AG7TC9CT14AGAG9CT26GA4CA14TC1AGAG2AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG3AG1AGAG10AG39AG7AG1AG11AG2AG12AG4AGAG6AG32GA3CT4AG4TC3AG14AG11AG2AG10AT12AG16CT3CA2AG22CT2TC8AG29AG3AG43GA6AG11GA4AG2AG5AG3AG8AT8AG5AG1GA8TC11GA31AG19CA13AG5AT8TC1AGAGAG8CT2AG49AG5AG23TC5CTAG10AG23CT15GA5AG1AGGA28AGAG3AG61GC31AG15AG18AG6CT14AG2AG17AG1AG2AGAGAG4CT38TC4AG3AGAG17AG23CGAT9CA10AG27AGAG1AG2GA2AG4AG6CT5CT2TC4AG11AG22AG23GA42AGGA24AG3CTAG33GA13AGGCGA2AG24GAAG23AGAGGA13CT3AG26GA24GA2CATC4GACG11AG1AG22AG2TC8AG7AGAG4TCGA1AG2AG23AG11AG3AG5CT17AG7AG28AG10TC12AG10TC2AG12AG8AG1GA8GTGA1CT3AG17TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG5AGAG1TC2CT7AGAG2CA12AG5AG2AG29AGGC1AG7AG12CT5AG10AG8AT8AG16AGAG68GA6TC5AG5CG1TC60AG5AG7AG21AG4CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG4AG4AG11AG2AG3AGAG1GA9AG5AG1TA14TC32TA28AG48TC18AG24AG10AG35CT14TA18AG22GA1AT31AG39TC33CA52AG21CA21CT2AG5AGAG7CAAG1AG4AGGT4CT9CT9AC1AC6AG2CT22TC2AG4AT2AT5AG7AC8AGAG32AG2CT8AC46GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6GC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG13AGGA2AG16CTCT12TC4CT2TC2-T10AG6AG9GA3AG1ACAG3TC22AG16AGCATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC13CT35TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT10AGGC13GACT20AG3TC6TA1AC10AG6TA10AGGA24AC3GT27AG5C-G-3A-C-C-A-G-G-A-4TA8AC4AG5AG-G-G-G-G-T-G-G-A-G-A-T-G5TC1TA2TC5AG4AGGT7AC8CT1-C-A-G1CA2CA4AG17AG9AG5AG8TC36AG1GT6AGATGA14AC2CA25GA6GA7CT3AG1AT14CAAT29GA28AGAG23GA3CT18CG6TG9G-A-A-2AG2TGC-T-A-3TGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-2ATTG5A-T-G-A-C-3AGGA7AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT12GA2GA11G-2AT1T-A-G-T-G-G-A-A-7ACGA2A-A-A-4GA1AT3TC2AG24AG40TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG7AG4GA6TGAT2GC2CT2AGCA1TA7GA4AG8GA17GAAGAC1GA1TA1AG4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA7TG12AGAG9GA2AT2GA1TC3TC12AG3AGAG18AT7GA16AG1ATAT5AG5AG2A-T-G-7TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGAT2GA35GACT2GATC7AG2AGA-G-A-1CTA-A-C-5TC1GATC5TGAT1ACAG3CT6GA3AG2AG12AG8AG30CA15AG2AG11CA1TG22AG13AG1AG3CA1TAAG7CG6AGAG6AG20AG8GC3GA52AG14AG40AGAG24GA8TG1AG14AG15AGAG6AG9AG20AGAC6CT1AGAG4TC5AG3C-C-C-1A-G-A-T-A-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AG3AC1AG7GA7TC3GAAG1ATCT4TC1TCATAC10CG4AG2GA5AG6CA13CA5AG1CA9GA1AG11AG5AG4GA4TA3CA1GT5AG1AG10AT17AG8AG2AG17AG2AG4GT24AG4CT8GA2AG2GT7TA11AC22AG3CT8GA4AG6AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC32GAGA10AG8AGAG7AGAGAG2AGAG5AC2GC2GA7AG9GA7AG10AC13AT14CTAG7AC14AGAG9AG1AG11TG5AG3GCCT1TG11TG11CG1CA16AG4AGAGGACT13AG3AGAG5TG5GA3GTCATGCTAGGT1GACT1AG8GA1CTAG3AGAG13AG4A-G-G-C-C-A-G-T-A-A-G-A-A-A-G-C-C-A-12AGCA2AG3AGAG19AG4GA10CA1TC31AC1GTTG6CG12CG4AG2AGA-A-A-5AG13GC18GA14AG1GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA16AG7AG7TA7TAGCTC3AG9TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG7AG1AG2AG2AT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 -MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9719,597,8541,9137,1,596,0.0,658,88.610,529,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA16AG7AGGA6TA7TAGCTC3AG9TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG7AG4AG2AT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,9027,371,9347,622,9625,0.0,10818,92.279,8330,plus,27AGAGAGTA1T-2A-1CA1G-T-G-G-CA2CGCAGA1AGCGAG2TA1T-3C-3GA9GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,542,8815,9347,1,540,3.18e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,28,91,118,622,649,0.002,42.5,100.000,28,plus,28 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,9048,269,9266,600,9625,0.0,10863,92.352,8356,plus,5TC2GTGT2AGCTTC2AT1ATTGCGCA23C-TA1TA2TG1AC2A-2G-1TACG1CGTACA2TG4T-C-T-1TC2C-13GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,542,8734,9266,1,540,6.01e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,73,220,271,577,649,8.11e-04,44.0,71.233,52,plus,24-A-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T-G-G28 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,9720,18,9686,1,9574,0.0,11694,92.407,8982,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA164-G1TG5GA12TC31AG25CT82GA3AC97CT3AG14GT20TC8TC7GA28AG16TG35GA19CT5GC26CT8GA19A-C-A-C-A-G-G-A-A-A-C-A-G-C-A-G-C-C-A-G-G-T-T-A-G-A-C-8AC6GACT26AG6CA1TC89AG50TC11TC75CG1AG20CT76CG11GA27CT41GA8TC93AT70CT20AG41GA8AC5AG29CA12AGGC1GA16GA11AG12GACT27GA5TC1TC5AG99AG12CT4AG20CT24C-C-A-13TG8TC2TG2AT16TC7AG8AG17T-C-C-7GA9AGAG46GA26GA23CA4AG3AG73CT117TC8AG101AG14AG119GA69TC38AG37CT86TC22AT5CA2GA9AC2GA26AG29AG6GA13AG19AG7TC4TC2CA17AG26GT48AG1CA32AGCT7AG5AG32GA4AG21GA24GA4GA18TC19GA26GA51GC4AC10TA52GACT55GA8GA19AG1TC11GA3AG77CT2CT14AG47TC29AG6ATAT22GA1CT21TA10TC33CT19AG35CT5GA24AC21GA12AG5GA20CT59TC21TC19GT107GA23AG8GA27TC26AG49CT11GA20CT5CT41AT21AG2AGAC8AG21GA17CA203CA5CT6CT15TC40GA28TC26TA126CA30AG9AG23TA7ACAC8AG27GA1AG10CT61GA50CA26CT8TC11AC14TG3AT19TC47GA37GT9CT13AC3GA2AG5AG47TC14TC24GA27AT9AG11TC19AG14GA33TC7TC2-T17AG16AG3TC40GA34GAGA13CA3TC11AG2CT25CT8GC43CA6CA3AGGA11GC6GC1CT5CT24TC7TA2AC5TG14CT11GACT4CA26CA31GA24AC3GT27AG5G-G-G-G-G-A-T-C-3A-4TA10-T-G-T-G-G-A-G-A-T-G-G-G8GT6TC1TA10AG16AG10CAA-A-C-10TC29AG7AC37AGGA66GA5AGAGAT21TC6GA5AG22AG27TC16GA5TC13CG1CT4TG3-A-C-T-G-A-T-T-T-G-A-A-G-A-A-T-G-A-T10CA3GT5TC2AG1-G-A-A-T-G3CA1-G-G1CGCA2TG2AG-A-G2GA15TA3CT1GAAGAC3GAAG8AG4AGAT1-C5G-9CT8GA11GA4CA6GA1GT4AC2ACGC1A-T-A-A-G-A-G-T-A-A-T-A-A-T-A-T-T-A-4T-T-C-2GA3AG1TC6CT11TC8AG71GA6GA6ACAG14GA23GA14TA53CA13AG4AGGT10AG28AG2TCGAAC1AT5AG40TA2AC1CG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA1CT2AG20CTTACG9CA4CAAT21GAAGAC6GA2AG9AGGAGA1AT12GA7TG1CACA20GAGA6TC16AG30CA19ATATG-G-A-G-A-C-4GA1GT1TC5C-T-C-3TC2GA2AG7GA1T-A-G-T-G-C-T-A-C-T-A-T-C-A-4AG2TG2T-5TC2TA5AC4AC3TC1AG5GAGA12TA8GA33AGAT11CA4TC6CT18GATC12CT4AG2CAGC2CT1GA1AT18TG9AT76GA27GA8-A-G-T1AGCG1TA1GA6CT46GC3GA24TA21AG20AG66GA24GA45CT9AG14AG26AC1AG9AC1TC1TC18AC9GA20TC2AT5CA13GA14AG6AC21CA25GA10CT18AT14AG32AG37CT14CT4TC5CT4GA1TC29CA4GA31GAGT2CG14TC3AG6TA6TA3CT57GA40TC8CTGT6GA9AG8CT23CT11CT45AG2TG5AG18TG3TC7CG25GACT22AG13AGGTCG1AGTA11GA20AC5G-A-G-C-C-A-G-C-A-G-C-A-15GA30GA3CT24CG2AG37AG25GC33AG2GA61CA2AG9GT15GA4TC2TC8TC1TA11GA1GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,663,9,671,9077,9719,0.0,789,91.855,609,plus,3TG2CGTA22CA2AG9GT15GA4TC2TC8TC1TA11GA1GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA133 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,509,9178,9686,1,489,3.68e-161,566,89.194,454,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 +MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9718,9070,480,9481,576,9624,0.0,10871,92.271,8369,plus,26-G-A-C-C-C-T-T2-A-G-T-C-A-G-T-G-T-G-G-A15C-3A-1ACTC2G-G-C-TA1GA1TGAG2TCAT2GA1TG1CGTACA2TGAG2TA17GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9718,542,8949,9481,1,540,8.48e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9718,9034,70,9055,648,9620,0.0,10451,90.779,8201,plus,19AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA69GATC9CT2AG12AG1TGGA20CT6CAAG11AG20GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG13CA23GAAG28AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC8TC20GA2TC8GT8TG59CT14AG8AG6TC31GA2GA11CT47CTTA8GACT3AGGA21AG2GA2AT30AG4TC50GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA21GA10AG20AC1ACAG1ACTA6GAAG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA27CA8GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTCG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA20CA7CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA30CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC1CA26CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA25AGGACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT24GA23CT15TC2AG21GA2GT9CT5CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA20CT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CTCA7GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2ACAC5CT11GC14CT24TC6TA1AC17TA11GA24AC3GT27AG5CA5CACA-T1GTGC2GC1AC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT4AGAT14CAAT29GA53GA3CT18CG6TG9A-G-2TG3-A-A-T-G-A2AC6TC3TAAG2AG1-A-G-C-G-G-G-A-G-A-A-T-G4CT3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT4GA7GA2GA2TC8GA1AT4G-T-G-G-A-A-A-T-A-4GCGA2A-A-A-4GA1AT3TC2AG24AG12AG27TA30GA4GAATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC1CT5AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG19TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA11ACA-6TC2TGAC7AG4AC6-G-A-A1GT12GA7TG23GA2AT2GA1TC3TC36AT7GA18-T-T-T3GA5-T-G2TGAT1TC2G-2TG3-C-A-A-A-T-A-A-C6TGCG2AG1AG4TA5AC30TA8GA9GA12TC9CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CTAC5GA59CA18AG11CA1TG20AG2GA18CA1TA8CG44GC3GA52AG14AG66GA8CG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8GT1CG7AC1AGGA6GA11GAAG1ATCT4TC1TCATAC10CGTA3AG2GA5AG6CA13CA7CA9GA16GA7GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11CG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA10TA5GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG3TG5AG5GT3GCACAGCG1CG8AG2GACG16TC18AG22AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 +MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9718,537,8519,9055,1,536,6.00e-175,612,89.944,483,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG3TG11GT3GCACAGCG1CG8AG2GACG16TC41AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,9022,565,9537,623,9624,0.0,10905,92.596,8354,plus,26A-C-T-C-TG4T-13TGAG20GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,542,9005,9537,1,540,6.18e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,28,370,397,622,649,0.002,42.5,100.000,28,plus,28 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,8983,200,9165,768,9675,0.0,10441,90.927,8168,plus,51CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC9CT2AG4CA7AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG2TA35AG28AG18CT73GA11AG10CATG2GA18TG19CG23GA29CT36CA25TA2CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA24GA2AT30AG10AG44GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG65CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC63CA19AT21CT52AG29TC5CTAG10AG23CT15GA7AGGA94GAGC55TC10AG6CT17AG18GA10CT38TC51CGAT9CA15AG25AG2GA14CT2AG2CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG47TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA2TA3CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGGC9AG12CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC110TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA19CTCT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2GA2CACA-T1GTGC2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-2TG2AGT-C-T-A-3CGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11GA1AT1G-T-A-G-T-G-G-A-A-7GCGA2A-A-A-4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA7GA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT14A-T-G-7CAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG1AG3CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC1CT8CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT12CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1AT2AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,592,8574,9165,1,591,0.0,690,90.878,538,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1AT2AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,129,1,128,778,650,1.18e-41,169,96.124,124,minus,19AT3CT21GC23-T41TC17 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,72,130,201,623,694,1.90e-21,102,98.611,71,plus,44AG27 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,48,9167,9214,463,510,5.46e-12,71.1,100.000,48,plus,48 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,48,9167,9214,9547,9594,5.46e-12,71.1,100.000,48,plus,48 +MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9718,9067,648,9663,640,9642,0.0,10107,89.324,8099,plus,27TGAGGA62AG22-A-A-A13AG20AGAG13TA24ACAG27AG10GA57CT2CT5TG9AT7AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC8AC4ACGATC1CG2GACT20GT12CA31GA19AG3GA20CT2TC8GA2AG23GA95GA10AGAG30GA75CG2AG8GA27CT20AG11GA30TC9AG49GATCCT17AT8TG10AG15AG2AG11AG32AGAG7AG2AT35GA17AG42AGAC2TC41CT28AG6TC100AG18CA3AG9AG4CT52TC1AG3ATGA6GA7TC18GA1GA5AG3GC11GA9AGAG40AG5GA35CT17AG16AG17AGAG11CT30ACCTTC68CA6TC14AG4TC20TC8AG12CA7AG8AG3AG67AG8AG3AGAGAG2GA12AG61AG19AGGA11AG16AGAG12AG10CT6AG13GA6AG10AG5AG18AG11AG9AG33TC3AG9AG35AG4AG30TC24GA32AG5CT9AG17AG25AG11CTTC6AG2AG1AG2TC1GT11TC20CT8GT5AGAG52CA5TC27CT4AGAG1AG11AG14TCGC3AG9GA2AG19AG4GA7GA11GA4AC38AG3AG22AG36GATA11AG10GA50GA10CT3AG3AG64GA5AG8CT4GA9AG8GA2AG7AGAG2TA2CA1AG9AG16AG6CT4AGAG8CT25AG6AG5AG5GA2TC2TA14TC12AG10TC1AGAG12AG21GACT14GA6TA31AGCT1GA10GA6AT11AG39CT2AG4AC18AC1GA12AT46CT2TG4AG16AG5AG2AG32AG13CA12AG19AT2GA3AG12AG5AGAG45AG13TC11CT9AGAG8CT4AG20AG11TC34AG21AG31GA8AG11CT2CT2CT17GA1AG6GA3GA10AT8AC1CG10AG12AG11AG2AG3AGAGAGGA13GT3CA25AG45AG35CA93CA19GA46AG4GA25AG2TC2TC79AG61CA32CTAG5AGAG6CTCAAGAG28AGTC35GA34AG33AG5AG19AG1GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG51AG7AC22CT5AG10GAAT25CTAT5TC11AG22AG10AG7AG1GA4TA31TC12AG4CT1AG16AG1CT24AG18TC34GA3CG10AT14AG2CT25CT8GC46CG3CA3AGGA18TCATCT5CT9GA7TC11TC2TA2TCACTA3TG2AG23GACT4TA15AG1GT8CA12AG11AG6GA1GA6TC15AC7TA1AGGA32TACAAT1GT-C2GC1GC2AG1CGAGGACG2TGTG-G-G2AG5AG5TC10AG1AG13AG4AG2GA4CACA1GA1GT19AGAG14GAAG7AC37AGGA8CT11AG43AG5AT1AG1AT6AG6GA16GA3AG10TA28AG9TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CGTCTGCGTG1-G-A2AGCA2CA1TG-G2-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG1AGAC1AG6GTCAGT3CT11AC5TA2GA2GCAC7G-A-2AT2A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT15AG18TA13AG7AG8GA13AC5GA5AC27GA12AG6AG55AG1GA10AT4AT4AG6AG6AC13TC4ACGAAC1GT1CTAG2CGGA4TATACT4TC27TA2ACACAG3-C-C-A-G-A-G1AG7AG9TGAT5CT4GA1T-A-T-4AG2GA1CT2AG2GA21GA1-A-G-C3TA4GA23CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT5AGAG9GA8AG18AGAG1AG4CT5TC9TA2TCCA15CT1AG1ATCT3AT1A-T-G-5GTAGTG3TAGC-T1CA1-G-G3TA3GA1TC3CG1GAAGAGTA3AG1TC-A-C-A5AC4AC25CA8GA5AG29AG9AGCA3AT19AGGC1TA12AG1GTAG1GT3-A1AC3TA1-T-G-A-G-T-C-C-G3CT3TC9AG3AG1AG6AG3TC12AG24GA13AG2AG19AG20GA11AGAG2CA8AT8AGAG6AG8CAAG10AG8GC2GA2AGGA9AT11GA1GT1CA17AG20AG21TC18AGAG5TC18GA10AG12CA16AG2AGCA4AG9AG20AG9AG4CGGC6AGGA3G-G-C-4C-A-A-A-A-2TCA-C-A-A-A-A-G-3AG2TAGC1CG4AG1GA2AC3TC5AG3AG4AG3AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG3AG24CA11AG11AG5AG4GA5TA2CA1AT18AT25AG3AG39AG9AG5CT11AG10TA7GA7AG3GC14AG3TCAC6AGGA4AG12AG2GA7GAGT17TC3AG10AG9AG8AG26CA17GA1TCCG1AG15AGAG6AG1AG3AGAG16AG2AG9GA5CT1AG27CT11CTAG7TC4TC9AGAG9AG1AG1AT6AG2TG5AG2AGTC1AT8TA3TG12GA17AG4AG1GACT13AG24AGAT1GA2AGAG2AG1ACAC1GA1AT2GA1AGAG8AG2A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-A-A-G-A-23AG3AGAG11AC7AG6TC8CA1TC7AGGC14TC7AC24AG6G-A-T-5AG13GC7TG13CA8TC2AG6CG7GT39GA2TC9AG3GA41TC33AG2AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT4AG18AG7CT3TA6AG14CA12AG11ACAT11TA2AT3AGGA11AC6TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 +MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9718,558,9120,9663,1,558,4.74e-171,599,87.993,491,plus,11GA2TC8ACAG3GA41TC10GA22AG13CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT4AG1GA16AG7CT3TA6AG14CA24ACAT11TA2AT3AGGA11AC6TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 +MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9718,9070,541,9544,577,9624,0.0,10845,92.161,8359,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG1AC2A-2GA1TG1CGCATA1CGTGCGCA2TC1TACG2CG10GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9718,542,9012,9544,1,540,3.24e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,8889,661,9500,755,9625,0.0,10721,92.496,8222,plus,3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG81A-T-G-G-G-21AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC39AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,544,8966,9500,1,541,1.71e-174,610,89.890,489,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,99,9492,9589,4443,4345,9.70e-29,126,94.949,94,minus,4GT7GA36AG20CT9-A18 +MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9718,9087,581,9617,577,9626,0.0,10878,92.253,8383,plus,26-A1TC2ATGTCT3GCGACGGTCGCTCG3C-A-G-21G-G-A-C-T-C-T-G-G-T-3T-2AG2T-3C-A-C-TG3TG1T-A-1CA1GATG2CAGACA1GC7A-8GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9718,544,9083,9617,1,542,1.19e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9718,9068,479,9485,577,9624,0.0,10905,92.402,8379,plus,25A-C-TG1ACACTCCT1CT3-T5CT1C-C-C-3CA1G-G-G-AT40TGAG20GA29AG20-A-C-T-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2GT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA24GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA29TC5TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTTA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA13GT4AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 +MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9718,542,8953,9485,1,540,6.15e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 +MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9718,9071,349,9353,577,9624,0.0,10887,92.316,8374,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG2TCAT2G-1TACG1CGTACA1AGAGTGCA19GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9718,542,8821,9353,1,540,8.37e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,8942,204,9098,747,9607,0.0,10391,90.930,8131,plus,2GT2TG1AC15TC48CG2CA8CTACAG27AG4GA4CAGA45CA8CT2CT29CT1AG7AC7AG2CA6GT50GATC12AG5GA8TGGA4GA2TC5AG14AG32GAAG14G-C-C-12AC3AG2GACT2AG17CT14GC5AG26CT5CTCT20AG13AT14AG18CT7GA92GA32GT5AG3GA16AG2GA55CG10CA10CTGA16CT18TC5CT16GA12GATC7TC58GA11TC17AG6GAGA51CT22GCAG38GA9AG13GA8AT16CT4GAGA1GT2CGAC1GA27AG14CT9CT23TC1TC29GA42CT2CT29AG12CT13GA8CT35G-G-A-G-A-G-C-C-T-C-A-G-G-C-C-A-A-C-A-G-C-C-C-C-A-C-C-A-G-T-14TC5AT7GA2GA1CT3TCTC12AG4GT9GAAC3CA3CT3GA9AGAG19ACGC1AC24AC19CT33GACGGT75GCCT9TC14AT2TA32TC17AG38TC8AG14GA27AG58AG14AG14AT27AG31GA80TC5AG18AG25CA26AC32CT81TA16AC29AC23CT56AG2AG3GCGA11AG6GATC28GA43GA19AGAT9GA5AC1TG33AG8CT23AG10AGAG20GA12TC58AG39AT7AC23AG11GA56GA53GA6TA1TC44AG25TC12CG40GA3TC6CT4AG66TG4TC30AG5GA1CT14GA13AC9CA5AG5AT15CTTA6AT11AG10CT9GA45AC21GA34AG4CT3AG16TC20GA21AG4GA2TC9TC21GA9AT2GA7GA36CT68TC12AG25GA14CT12AG82CT3AC1CT41AT21AG2AG1CT2AG4AG21GAGA16TA17GA11GA32AT11CA50TC59TC45TA13CT27GA28TC20GA11GA41AG17CA60CA30AGAG4AG3AG27GA3AC9AG37GAAGGA6GA17TC4GTCA4GA5GA38AG3GAGA9AC5CA2GA6AG1CA24CT10TC11AC12CA1TG3AT10TC1GT54GA22GT1GA37TG5AG53TC28AG2AG6CA1GT11GA12CACTAT5TC3AG11TC34GA20GT20TC19AG16AG3TCCT1CG22TG13AGCA35GA10AC25CT21CT1CAGC5GC35GA1AC5GA2TG3TA1AC1AGGAGA1CA5GA9ACCT33TCTA1TC2TA1A-G-A-1GCTC13AGCT16GAGT22AT8CA1TC40AG1AT2CA8AC3GT33G-G-G-G-G-A-T-C-3A-4TA1GA5GA14-G-G-T1CG1CG1ATTG1CGTG18AG2AG5TCAT3AG10CA34AG5AG8AC11CT90AG1GA5AGAG46TA2AG5AT5CT3GA4CT52CGCT5TG6AG5A-C-C-A-T-T-G-A-G-C-C-A-2CG4CA6ATGA6TG4-A-G-C5-A-A-T1TA2GAAT2GA9AG2GA1CA16GA3CG7CA6AG4AGGT1AC14CT1CT15GA2GA2GC3CT2GA1GA1ATAG3AC2AC5TA2GA5TC9TC7ATGC26AC5AG47GA6GA4AG1AC16ACAC5ACCA10TC82GA9CT7TA1AG6AG4GA22AC1AT6TA33-A-A-AGA4-T-C-C4AC2TG1TG2CG16TGAT1GA3CT4G-A-T-1TA7GA4AG3AC21AG2AC1GA1TA7CA9CA3GA1GA4AGAC6CAAG11-G-A-A1GT3GACA7GAAT6AG1CA29TC40AT4GAGC4AG3TACA1TA1GT1-CAT2CG1ATCT2CT1AGAT3-T-G1TATG4T-G-3TG1CG1A-6GA2AC1AG1TA3-A-G-T-G-A-C2CA4TCAC8TC29AGGA1GA29TCCA19GA14AG23GT1CA2A-C-1GCGA3GAGT2A-C-A-G-1ATACTC4CT15GA3AG6AG30CT9GA5AG65AGCGCA9AT14CT4GA26AC3CA46AG12CT10GT11GA32AC2AG15GA16GA7GAAG26CT17CT9AG14AGTC14GA1AT5AG1TAAC1CG6GA1CTAC1TCTATC3TC6CG7TC1CG20AG1ATAT4TC2CTACAC3CA4GA3GT4GA8GA43AG16GA5TA4CT11CT6AT8TA1AG14AGAG20AG37CT22GA1TC5GATC67GAATCTAC15TC4AG12TA7AC94AC18GC4GA2AG41AC16TC22AG8TG3CT4AG2AGTC9-T-A-T-T-C-G-C-C-A-C-A-T-A-C-C-T-A-G-A18AG5CA33CAAG4AGAT2GT2AG4GC2GAAC16GACG2AG1AG5GC11GA12TC9TC7GA31AG3AC15TC43AC9GA5GA11CT7GC4TG44TC5TC1TC7AG9CT15GA5AC49AGAGCT5TACT6TAGC14TA18TG9GA1GA5AG19AC16AG19GT3AC1CG8GA6AGTA5AG30AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT22AG1G-G-G-A-G-G-C-G-T-G-A-C-11-T22GC21CT3TC5GT47GA6GA15 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,535,8565,9098,1,523,1.26e-164,578,88.037,471,plus,8TC5TC1TC6ACAG9CT15GA5AC24GA24AG1CT5TACT6TAGC14TA18TG5TG3GT1GA11TC13AC16AG13GA5GT3AC1CG8GA6AGTA5AG28GA1AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT12G-G-G-A-G-G-C-G-T-G-A-C-10AG12-T22GC21CT3TC5GT47GA6GA15 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,161,1,161,4772,4612,1.47e-54,212,95.652,154,minus,48GT11TA32CT11CT17AT16CTCT19 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,51,160,210,649,699,2.00e-12,72.5,98.039,50,plus,18AG32 +MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9718,9114,49,9137,649,9680,0.0,9883,88.227,8041,plus,18AG41-A23CG9AG11GA3TA11AG20AG26CG12AC3AG10TCAGCGCT11AG15GA48CT2CT12AG1GATA13CT2GA5TA2AG15GT44AG5GATC12AG7AG4AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC2AG8AG8AGCG27AG10AG28AG18CT50AG1AGAG19GA11AG11TG13AGAG6TG19CG22AGGA8AGAG19CT24AG3AG36CT10AG10AG1GA16AG13GATC7TC14AG18AGGA2TC28AGGA2TC2AG5GT8TG10AG18AG14TC14CT14AGAG7AG6TC46CT41GT5CTTA8GA4AGGA10AT1AG14AT30AG10AG17AG6AG7AG13AG26AG20AG7TC9CT14AGAG9CT26GA4CA14TC1AGAG2AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG3AG1AGAG10AG39AG7AG1AG11AG2AG12AG4AGAG6AG32GA3CT4AG4TC3AG14AG11AG2AG10AT12AG16CT3CA2AG22CT2TC8AG29AG3AG43GA6AG11GA4AG2AG5AG3AG8AT8AG5AG1GA8TC11GA31AG19CA13AG5AT8TC1AGAGAG8CT2AG49AG5AG23TC5CTAG10AG23CT15GA5AG1AGGA28AGAG3AG61GC31AG15AG18AG6CT14AG2AG17AG1AG2AGAGAG4CT38TC4AG3AGAG17AG23CGAT9CA10AG27AGAG1AG2GA2AG4AG6CT5CT2TC4AG11AG22AG23GA42AGGA24AG3CTAG33GA13AGGCGA2AG24GAAG23AGAGGA13CT3AG26GA24GA2CATC4GACG11AG1AG22AG2TC8AG7AGAG4TCGA1AG2AG23AG11AG3AG5CT17AG7AG28AG10TC12AG10TC2AG12AG8AG1GA8GTGA1CT3AG17TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG5AGAG1TC2CT7AGAG2CA12AG5AG2AG29AGGC1AG7AG12CT5AG10AG8AT8AG16AGAG68GA6TC5AG5CG1TC60AG5AG7AG21AG4CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG4AG4AG11AG2AG3AGAG1GA9AG5AG1TA14TC32TA28AG48TC18AG24AG10AG35CT14TA18AG22GA1AT31AG39TC33CA52AG21CA21CT2AG5AGAG7CAAG1AG4AGGT4CT9CT9AC1AC6AG2CT22TC2AG4AT2AT5AG7AC8AGAG32AG2CT8AC46GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6GC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG13AGGA2AG16CTCT12TC4CT2TC12AG6AG9GA3AG1ACAG3TC22AG16AGCATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC13CT35TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT10AGGC13GACT20AG3TC6TA1AC10AG6TA10AGGA24AC3GT27AG5C-G-3A-C-C-A-G-G-A-4TA8AC4AG5AG-G-G-G-G-T-G-G-A-G-A-T-G5TC1TA2TC5AG4AGGT7AC8CT1-C-A-G1CA2CA4AG17AG9AG5AG8TC36AG1GT6AGATGA14AC2CA25GA6GA7CT3AG1AT14CAAT29GA28AGAG23GA3CT18CG6TG9G-A-A-2AG2TGC-T-A-3TGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-2ATTG5A-T-G-A-C-3AGGA7AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT12GA2GA11G-2AT1T-A-G-T-G-G-A-A-7ACGA2A-A-A-4GA1AT3TC2AG24AG40TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG7AG4GA6TGAT2GC2CT2AGCA1TA7GA4AG8GA17GAAGAC1GA1TA1AG4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA7TG12AGAG9GA2AT2GA1TC3TC12AG3AGAG18AT7GA16AG1ATAT5AG5AG2A-T-G-7TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGAT2GA35GACT2GATC7AG2AGA-G-A-1CTA-A-C-5TC1GATC5TGAT1ACAG3CT6GA3AG2AG12AG8AG30CA15AG2AG11CA1TG22AG13AG1AG3CA1TAAG7CG6AGAG6AG20AG8GC3GA52AG14AG40AGAG24GA8TG1AG14AG15AGAG6AG9AG20AGAC6CT1AGAG4TC5AG3C-C-C-1A-G-A-T-A-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AG3AC1AG7GA7TC3GAAG1ATCT4TC1TCATAC10CG4AG2GA5AG6CA13CA5AG1CA9GA1AG11AG5AG4GA4TA3CA1GT5AG1AG10AT17AG8AG2AG17AG2AG4GT24AG4CT8GA2AG2GT7TA11AC22AG4AC7GA4AG6AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC32GAGA10AG8AGAG7AGAGAG2AGAG5AC2GC2GA7AG9GA7AG10AC13AT14CTAG7AC14AGAG9AG1AG11TG5AG3GCCT1TG11TG11CG1CA16AG4AGAGGACT13AG3AGAG5TG5GA3GTCATGCTAGGT1GACT1AG8GA1CTAG3AGAG13AG4A-G-G-C-C-A-G-T-A-A-G-A-A-A-G-C-C-A-12AGCA2AG3AGAG19AG4GA10CA1TC31AC1GTTG6CG12CG4AG2AGA-A-A-5AG13GC18GA14AG1GC4CG5AC34TA9TC5AC13CT15CA5AC22CT18AG7AG7TA7TAGCTC3AG9TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG7AG1AG2AG2AT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 +MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9718,597,8541,9137,1,596,0.0,658,88.610,529,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA16AG7AGGA6TA7TAGCTC3AG9TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG7AG4AG2AT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,9026,371,9347,622,9624,0.0,10828,92.311,8332,plus,27AGAGAGTA1T-2A-1CA1G-T-G-G-CA2CGCAGA1AGCGAG2TA1T-3C-3GA9GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,542,8815,9347,1,540,3.18e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,28,91,118,622,649,0.002,42.5,100.000,28,plus,28 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,9047,269,9266,600,9624,0.0,10873,92.384,8358,plus,5TC2GTGT2AGCTTC2AT1ATTGCGCA23C-TA1TA2TG1AC2A-2G-1TACG1CGTACA2TG4T-C-T-1TC2C-13GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,542,8734,9266,1,540,6.01e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,73,220,271,577,649,8.11e-04,44.0,71.233,52,plus,24-A-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T-G-G28 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,9719,18,9686,1,9573,0.0,11704,92.437,8984,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA164-G1TG5GA12TC31AG25CT82GA3AC97CT3AG14GT20TC8TC7GA28AG16TG35GA19CT5GC26CT8GA19A-C-A-C-A-G-G-A-A-A-C-A-G-C-A-G-C-C-A-G-G-T-T-A-G-A-C-8AC6GACT26AG6CA1TC89AG50TC11TC75CG1AG20CT76CG11GA27CT41GA8TC93AT70CT20AG41GA8AC5AG29CA12AGGC1GA16GA11AG12GACT27GA5TC1TC5AG99AG12CT4AG20CT24C-C-A-13TG8TC2TG2AT16TC7AG8AG17T-C-C-7GA9AGAG46GA26GA23CA4AG3AG73CT117TC8AG101AG14AG119GA69TC38AG37CT86TC22AT5CA2GA9AC2GA26AG29AG6GA13AG19AG7TC4TC2CA17AG26GT48AG1CA32AGCT7AG5AG32GA4AG21GA24GA4GA18TC19GA26GA51GC4AC10TA52GACT55GA8GA19AG1TC11GA3AG77CT2CT14AG47TC29AG6ATAT22GA1CT21TA10TC33CT19AG35CT5GA24AC21GA12AG5GA20CT59TC21TC19GT107GA23AG8GA27TC26AG49CT11GA20CT5CT41AT21AG2AGAC8AG21GA17CA203CA5CT6CT15TC40GA28TC26TA126CA30AG9AG23TA7ACAC8AG27GA1AG10CT61GA50CA26CT8TC11AC14TG3AT19TC47GA37GT9CT13AC3GA2AG5AG47TC14TC24GA27AT9AG11TC19AG14GA33TC7TC19AG16AG3TC40GA34GAGA13CA3TC11AG2CT25CT8GC43CA6CA3AGGA11GC6GC1CT5CT32TA2AC5TG14CT11GACT4CA26CA31GA24AC3GT27AG5G-G-G-G-G-A-T-C-3A-4TA10-T-G-T-G-G-A-G-A-T-G-G-G8GT6TC1TA10AG16AG10CAA-A-C-10TC29AG7AC37AGGA66GA5AGAGAT21TC6GA5AG22AG27TC16GA5TC13CG1CT4TG3-A-C-T-G-A-T-T-T-G-A-A-G-A-A-T-G-A-T10CA3GT5TC2AG1-G-A-A-T-G3CA1-G-G1CGCA2TG2AG-A-G2GA15TA3CT1GAAGAC3GAAG8AG4AGAT1-C5G-9CT8GA11GA4CA6GA1GT4AC2ACGC1A-T-A-A-G-A-G-T-A-A-T-A-A-T-A-T-T-A-4T-T-C-2GA3AG1TC6CT11TC8AG71GA6GA6ACAG14GA23GA14TA53CA13AG4AGGT10AG28AG2TCGAAC1AT5AG40TA2AC1CG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA1CT2AG20CTTACG9CA4CAAT21GAAGAC6GA2AG9AGGAGA1AT12GA7TG1CACA20GAGA6TC16AG30CA19ATATG-G-A-G-A-C-4GA1GT1TC5C-T-C-3TC2GA2AG7GA1T-A-G-T-G-C-T-A-C-T-A-T-C-A-4AG2TG2T-5TC2TA5AC4AC3TC1AG5GAGA12TA8GA33AGAT11CA4TC6CT18GATC12CT4AG2CAGC2CT1GA1AT18TG9AT76GA27GA8-A-G-T1AGCG1TA1GA6CT46GC3GA24TA21AG20AG66GA24GA45CT9AG14AG26AC1AG9AC1TC1TC18AC9GA20TC2AT5CA13GA14AG6AC21CA25GA10CT18AT14AG32AG37CT14CT4TC5CT4GA1TC28TC5GA31GAGT2CG14TC3AG6TA6TA3CT57GA40TC8CTGT6GA9AG8CT23CT11CT45AG2TG5AG18TG3TC7CG25GACT22AG13AGGTCG1AGTA11GA20AC5G-A-G-C-C-A-G-C-A-G-C-A-15GA30GA3CT24CG2AG37AG25GC33AG2GA61CA2AG9GT15GA4TC2TC8TC1TA13GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,663,9,671,9076,9718,0.0,792,92.006,610,plus,3TG2CGTA22CA2AG9GT15GA4TC2TC8TC1TA13GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA133 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,509,9178,9686,1,489,3.68e-161,566,89.194,454,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 OQ092463,Ref.B.TH.90.BK132.AY173951,0,9605,8996,8952,688,9605,1,8896,0.0,10987,93.186,8342,plus,4TC12GAAG12AC45-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G6-A-A-A-A48GA15GC16AG1GA10AC24AG36GA2GA20GA2AG9AG17TC3AG13TACG26AG16GA5AGCT12GA14TG26TG14GA20AGAG17GA6G-2A-C-5C-C-A-G-A-C-8CTCT23GA2CT2CG68GA125AG144AC19AG8CT2TC21CT38CT26TC31AG14AG3TGGCTCAT31AC2AG14AG11CT20AG53AT2TC8AG14AG17AG4CA1CT3GC17GA9CT8GA7AT15CT17TC5TCACAG18AG2AG1GA11AG9AG23CT5GA44GA35AG13AC21GA30CA1GAGA13GA9GA2TG6GA74AG23CA4CA63GA54GA35CT4AG5AGAC22CT107CT23GA32TC77GA53AG11GA8AG56GA20TG4TC79AT124TG3TC1AG16AG21CT38AT32GA9TC4AG5GA5TC80AG26GA28GA3AG11GA30CA26AT7CT11GATA61GA8GA17AG23GA3CT23AG37GA2TC16GA12CA47AG23AG20GA5AG2TC17TC14TG2AG38TG38TC11GA23TC32CT66TA4TC1AG12AG9AC7CA5AC26AG63TC25TA2CG5GA20GA68CT3TC7GA17AG29GA11CT44GA54AC30CA32TC9AG8CT5CT32TC38GA20CT35GA22ATCT83AG30CA67CG140GAGA33AG6GA16GT1TG4AGGA9GC1CA2TC26TA2CT11GA2TG2GT1AGAC10CAAG32CA5CT8GA20-G6G-7GA15TA25GT30CT22GA21TA48GA9TG9AG28AG53GA65CT6CA11AG1CA9CT12CAAT5AG2TC17AG7CT36AG10AG18CT1TC2AT2GAGA18AG15TC33GA3TG7CA1TA4TC8GACA1GA28TC2CA5GC50AC3AG3AC41CT10ACCT5GC6CT2CG22AGTG31CA31AG12AT15GT30CT2GA2GA14AG7T-T-G-16CTGCAT13GA8CTTA8AG7AT47TC13AG23GA6GA17TC49GT12GA8CY7AC4GA6TC42CT23CT17GA9AG3A-1AG1TG1A-C-A-C-C-5CT4GA6G-A-A-T-A-C-C-A-C-C-C-C-7AG1T-G-C-T-A-G-T-A-G-2GA5GT1AGTA2GC1GA10AG30CA4AGGA5AT27GA2CT16GA16TC35AC53AG26CTAG12AG4TACAAC10CA13AG21GA9GA11AG3TC26AG22CTTA28TG5GA2TATC12CA5TC6CT6AT7AG5TA3CA15AG2CT2TA2TA1GA9CACA19AG12AC4AG2AGAC2GA19AGCA6TG7GA4GA10G-G-G-2TC5GT6AG7TGCA1CA28CT5AG5AT20AT7AT2TA26GAAGGC3-G-A2TGTACATA2-A-C2AT3T-3TGCA2A-T-G-1CA1CA24GA6AG5CA40TCAG6TACA4AG3TCTA1AC8CT12AT13TA2GT2ACAC1TA4AG2GC4AGCACG2CT2GA2TC10AG14AG19TC38AG10CT54AG50AG1AG22AT34TC77CT1GA38AG26TC42AT7ATCG8GA35GA11AG4GA8TC44AT3TC2GC46GC41CA18GA5GA4GA10CT6AG40CT27AC1AG8GA29GC8CGAC6AG1CT15AT10CT7GA76GA11CGTC6GA17GA33AG10TC5TC5CT23CT3AG21CT1GTGAGT6TA15GC6AC37GA1TC13GTTG4T-2T-T-G-G-A-9AG17CA2GA2GA7ATG-C-A-17GA104-G-G-G12TC7GAGA29TC4CG4GC44TC13GAAC34CT29CT18AG1AC4ATTC32GA14TC23AG2GA6AT21TA12TA5AG15GA1AG4GAAG8TC11TG18CATA21TC8CT52GT75TG12 OQ092463,Ref.B.TH.90.BK132.AY173951,0,9605,8996,576,38,613,8421,8996,0.0,756,95.833,552,plus,11GA11AC34CT29CT18AG6ATTC47TC23AG2GA6AT21TA12TA21GA1AG4GA9TC11TG18CATA30CT45TC6GT89TA98 OQ092465,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9659,8890,8931,654,9563,1,8890,0.0,10476,91.278,8152,plus,18TA2CT13A-32T-TC11GTGAAG42CT32AT9TA1AT47GA26GA26AG16AG10AG19AG8GA2TC17GT5AG6AG17TC23CA30AT13AGCT19CA7TG8CT5GA49TC13AG3AG11AG2GA33TC2CT20GAGC2AC31AG2AG13CG3CT1GA39AG5CT8CT12CT4CT41AC29TC5GA17GA5TCGC16AG5AT11CT5AT5TA7CA16GCGA11AGTC2TC6AG7AG23AC5GA7AC2AC1AC5AG1GA8TC3AGCT7CT9GA6AG5GA2ACTCCTCT25AT6TC6GCCTCT2AG14GA6AGAG12AC2AC2AG5CT1AC6AG5AC2CT2CT5TCAT10AT2AG2AC4CGAGGC2AT4AT6AC3TC3ACGC1ATTG3AC16GA7AG14AT2AG12GATC5CG1CG3GC2C-C-A-12GA1GA1CT2TC2CT1GA1AG9AGGA1CT6GA5CT2CT14GA2TC5TC25GA21AG8CT11TC8GA22AGGA2CT17GA5AC8TC11AG9AT12CA15CT21TC40AG10GA20CACA1CA6AG9GA3GA2AG1TC18CT32GA1CA11GA47GA10CA1GC3CTTCTCGA4AC2CT8TC2AG4TC9TA8AG41AG5TC2CT11TC102GA7CT23GA32TC29AG38AG10GA117AG2CA116TC100GA16AG4TG3TC1AG14GA1AG42TC17GT42TC10AG5TC8TC14GA5GA29CT11GA4AG11GAAG7AG9GA11AG15AGGA33AG39AT19GATA13AG3GT55AG10TC3AG11TA14GA8GA15AG30CT6GA6CT1AG8AG1GA3AG8CA10CT81GA29TC11TG8CT5GA6TATA22AG1TC20CTTC4AG2TG5CA18TC10TC3CT20TG4AG20AC58AG12AG17CA5AC2CTCT73GA2AGGA34TG2TA27GT29GA37CT3TC7GA44AG2GA59TC35GA68TCGA15CATC2AG47AT27GA16AG14CT35GA8AG13AT3AT44GA45TC20CA64TG144GA8AC18AG5AG6AG8AG1GAGAAT3AG7GA11CA2TC1TC1AC6AG15TA20AT5GA3AG3CT3AT87GA9GA11GA9TC8CT56TA5TG32GA27CT2AG39AG34AC3CT53GA23CT8GA8AC2CTAG7GA17AT5AG53TC7TA9GA23CTCATC2AG2GA35TC13GA2TC5AG17TC6TACATA2TC2TC5GACA86GA3AC6CT16CT12GA9GT13ACCT5GCTA5CT27GA21TA7AGCT1CA23AG7AG18TG8GA32GA5TC12T-C-A-G-C-A-2TGG-T-T-5GA8CT29GACT3AG5AC3TC15TC8AG18AT1TC5TCCT21AGAC3TGAT2GATC17GT5TC26CT8AG3GA9GA12GA21GA10AT2GA8GA26TC5AG35GA13AGTG4ACCT3GAGA1GACACGATATTG3AG1CT3AGGA8CG2CGC-A-C-C-C-C-3TA1C-C-A-C-T-G-T-3T-2C-2GA4GT2TA2G-G-G-1A-G-G-6AG18AG5AT5CA2AG2GA25CT7GA2CT4AG11GA5AGCA4-A-C-A-A-G-C4GCGATC6GA24GA15AT7GA21GA17AC13CTAG6CAGA9TA22CT25GA51GA5AG20AGGA12AC12TG6AG2TA17AGTA25AG6CA1AC1GA3CTCTAT4AG6TG1TA11CACA24CT7ACAC6AG3GA6AG1TA9GA1GA1AG1GA2TG3AC3GA3AG11GAGAGA3-C-A-A5GA7TC3TCAG3AT25GA1AGACCT5AG3TC1AG15TC15TA2AC1AG4TA8CA1TA4TG-C-A-G4CA2GA1TGAG-C-A-C6GTGAGA1GA1AT3-A-G1CA1AT2-T5CT1CA24GA12CATG41GC4CGTCCA4AG5CT9CT8AGCT19T-11GAAT1CTAGCT1GCA-C-A-C-T-16TG7AG6AG48AG9AG56TA-C-A-A61AG14GA35GA32GA59GA29GA2AG26TC24GA17ATAC3GAAGCAATCG1GA6GA1TC17AG27AG2TG9CACT12TG27TA10GC4AG4ACAG24GA10GA17AG26GA26GA2TC7CT36TC7AG11CA18AC1AG11GA20GAAG9GAGT1CACG6GAAG1CT14TC7TACA5GA53AG6AG20GA11CGTC6GA5GC34AG10AG4CT11TC5CT17GA18GA2TG6GT1GACTATGT1GT6TA17AC16GA5GA7TA4AG21AT4TCGA3TG3AG3CA2AGACATAG20GA11GA1AT2AG25CT10CT19CT23CT8TC32GA5TC2TC8GA29TC2GA1CG4GT70TG21CA10CA27CACA30TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GAAG8TC5GA7AGTC3AG1GA3CA19CT5GA11CT4CT8AT10GA20 OQ092465,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9659,8890,382,66,447,8509,8890,8.94e-130,462,92.147,352,plus,36TG21CA10CA27CACA30TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GAAG8TC5GA7AGTC3AG1GA3CA19CT5GA11CT4CT8AT10GA20 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,9788,1,9708,1,9719,0.0,11340,90.785,8886,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC7A-32TC6TC5TGAGGA39-A17-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G7T-75CTACAG43CA1GACT28AG5GA5TC11CT17GA2GA17AG2GA2AG5GA2CAGT1TC25AG4CT3TA1CA33AG7GA1GA11AG11GC20GC14GA14CA12AC1TC1AG2GACT35GC5AG15CG2CA35AG7TG11TC8AG12AT37TC87TG1AG11GT9GA4GA9CA1AGCA4GA34AC9GA7CG10CA11GA16CT15CA1TC29CT5CTGATC17AG60TC5GA11TG35GA29GA8AG8AG6TC41AG7AG33GA5CT6GC27AG12CACT1AG13CT11GA5TC1TCTA2TC1AG23GA76GA11CTGA6GA14CT49TC5AT6GA9TC7AG1CA31GA10AG40AG26CT20TA13AG11AG6GA95GA50AG5CT32AG40GA43AGCT15AG14AG5CT36AG16GA5TCGA3AC54TC29TC2TA69AG1GA26AC8CT1CT27CT14GT53TC2GA35TC20AG8GA27GA13AG14AG4AG7TC67CT24TG28TC23AG8CT23AG2CT11GACT16GA23GAGA12CA30GA50TC12CA51AT21GA14AG3AG14AG32GA1TC42TC1AG24GA9TC30AG11CT21CT13GA2AG14GA11TC23TC5AG30GA1CT1AG19CA7GT24CT11CT19AG66AC1GA11AGCT6GA24GA14CT53GA59AT44CT15AG10GA14TC5CT9TC40TA11GA15CT2AG8AG61GA8AG11CT5CT2GA38AT21AG2AGAC1GATC5AG3TC17GA5AG11CA25AG4AG55AT36GA56AG28CT63GA28TC77TC2CT72GA14TC6CT2AG1AT3AG9AG1AGAGTA5GT21ACTC51AG25TA52GA3GA9AC17CA29TC5TC11GC14TG13GATCGA7TC30CA16GA12AG21GA2GT23GC50AG9TC11GA7AG11AG5AG1GA27AT5TC5AC2GA2AG2GA14AT62TC2-T12AG21AG3AC2TG15GA6TG14CA35GA17TC14CT28AC5GC49TCCA3AGGAGA4GC12TC7CT24TC2GA4TA2GCAC5CT13CT11GA2CA22TC6CA44AT2GA1GT6AC3GT15TC5AC14GA2TACA-T1GTGC2GC1AC2AG1CGAGGACG1CTTG-G-G8GT8TA13AG17CT5GA2CA17CT20AG15TC19CT64GA19AGAT15GT5TC12AG20CG23GC10AG31CG6TG6-G-A-T-T-T-G-A-A-G4CA5TA-T-A-C2GA1GA3-G-T-A-G-C-G-G-G-A-G-A-A-T-G-A-T-A3CG1-G1CA2AG3AG21GA3AGTC4AGAC3GA8AGAT10CTGA4CT17GA2GA11GA6GCT-A-C-T-A-A-T-A-G-G-A-C-T-A-A-11GA5TC12TC14AG71GA3GAGAATGA4AGGAAC17TC5GC15CA17CT21TC7GA19GA14AG5ATAC3AT5AG6TC21AG2TCGAAC1AT5TGCA18TC1GA14GA3CA2AC1AG3GC-C-A-G-A-G-A14CA3TGAT1GA3CT4GA1A-A-T-7GA4AG2GAAC7GT4TA1CA1GT1AG2AGGAAG2GA1CA4GA1GA9CA1ACGA8AGAC6CAAGCAAG1GA6CG-G-A-A-A-T-A2GAGA1CA5GACTAC3GA22TA6AGCT2TC5CG30CT2CTAT2TA2GCCAGATC6GACTGA1GT2CT3ATAT1GAGA2CG1GA6CG2AC2CATAAGCGTG1GCGAGAGA3TC1TC2CA3TA1-G-T-G3ACTA5AC4AC16TA9GTAG6GA34AT3GC52CT1GA2AG2C-A-2A-A-A-T-G-G-T-G-G-C-G-A-G-A-A-T-G-G-G-A-C-C-C-A-G-A-T-T-G-G-C-G-A-G-4TA1AT2CG22GA32CT23GA9AG19AG32AGAGCG1TA1CA53GC8AG19TA21AG12CT7AG17AG32AG5TC34GA15AG39AG32AT8AC1AG6GAGAGTAC3TC18GC9GA7TC3GAAG7TC2AT11CG7GA5AG32GA12GA1CT15GA10CT18AT22TC2AG26GA11AG20CT11AG2CT7GA7GA2TC27CTCA2CA33GAGTATTCCG14TC3AG5CT6AGTA3CT8TC4TG14TA26CT1GA37GA26GA38TC5TC5TC1TC3TC3TG7GT5AG9AG9CT1AG5AG2AGTC12CTTCTGAC10CG3GA14AG6GACT23GT9-G-T-A-G-T-G3GTGT6GCTC1GA12AG6GA3AG1T-A-A-G-C-C-A-G-A-A-G-A-13AG2GA7GA15TC4GA3TC4CA3CA18TC6TC7AC2TGAT2TC20AG11CT10GC6AG28GC4CG7CT42TC9AG3GA21GA1TCCT16TCCT9GA25AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,635,1,634,9086,9719,0.0,755,91.811,583,plus,14TC9AG3GA21GA1TCCT16TCCT9GA25AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,637,9075,9710,1,636,0.0,749,91.366,582,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-11 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,9787,1,9708,1,9718,0.0,11355,90.835,8890,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC7A-32TC6TC5TGAGGA39-A17-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G7T-75CTACAG43CA1GACT28AG5GA5TC11CT17GA2GA17AG2GA2AG5GA2CAGT1TC25AG4CT3TA1CA33AG7GA1GA11AG11GC20GC14GA14CA12AC1TC1AG2GACT35GC5AG15CG2CA35AG7TG11TC8AG12AT37TC87TG1AG11GT9GA4GA9CA1AGCA4GA34AC9GA7CG10CA11GA16CT15CA1TC29CT5CTGATC17AG60TC5GA11TG35GA29GA8AG8AG6TC41AG7AG33GA5CT6GC27AG12CACT1AG13CT11GA5TC1TCTA2TC1AG23GA76GA11CTGA6GA14CT49TC5AT6GA9TC7AG1CA31GA10AG40AG26CT20TA13AG11AG6GA95GA50AG5CT32AG40GA43AGCT15AG14AG5CT36AG16GA5TCGA3AC54TC29TC2TA69AG1GA26AC8CT1CT27CT14GT53TC2GA35TC20AG8GA27GA13AG14AG4AG7TC67CT24TG28TC23AG8CT23AG2CT11GACT16GA23GAGA12CA30GA50TC12CA51AT21GA14AG3AG14AG32GA1TC42TC1AG24GA9TC30AG11CT21CT13GA2AG14GA11TC23TC5AG30GA1CT1AG19CA7GT24CT11CT19AG66AC1GA11AGCT6GA24GA14CT53GA59AT44CT15AG10GA14TC5CT9TC40TA11GA15CT2AG8AG61GA8AG11CT5CT2GA38AT21AG2AGAC1GATC5AG3TC17GA5AG11CA25AG4AG55AT36GA56AG28CT63GA28TC77TC2CT72GA14TC6CT2AG1AT3AG9AG1AGAGTA5GT21ACTC51AG25TA52GA3GA9AC17CA29TC5TC11GC14TG13GATCGA7TC30CA16GA12AG21GA2GT23GC50AG9TC11GA7AG11AG5AG1GA27AT5TC5AC2GA2AG2GA14AT62TC14AG21AG3AC2TG15GA6TG14CA35GA17TC14CT28AC5GC49TCCA3AGGAGA4GC12TC7CT27GA4TA2GCAC5CT13CT11GA2CA22TC6CA44AT2GA1GT6AC3GT15TC5AC14GA2TACA-T1GTGC2GC1AC2AG1CGAGGACG1CTTG-G-G8GT8TA13AG17CT5GA2CA17CT20AG15TC19CT64GA19AGAT15GT5TC12AG20CG23GC10AG31CG6TG6-G-A-T-T-T-G-A-A-G4CA5TA-T-A-C2GA1GA3-G-T-A-G-C-G-G-G-A-G-A-A-T-G-A-T-A3CG1-G1CA2AG3AG21GA3AGTC4AGAC3GA8AGAT10CTGA4CT17GA2GA11GA6GCT-A-C-T-A-A-T-A-G-G-A-C-T-A-A-11GA5TC12TC14AG71GA3GAGAATGA4AGGAAC17TC5GC15CA17CT21TC7GA19GA14AG5ATAC3AT5AG6TC21AG2TCGAAC1AT5TGCA18TC1GA14GA3CA2AC1AG3GC-C-A-G-A-G-A14CA3TGAT1GA3CT4GA1A-A-T-7GA4AG2GAAC7GT4TA1CA1GT1AG2AGGAAG2GA1CA4GA1GA9CA1ACGA8AGAC6CAAGCAAG1GA6CG-G-A-A-A-T-A2GAGA1CA5GACTAC3GA22TA6AGCT2TC5CG30CT2CTAT2TA2GCCAGATC6GACTGA1GT2CT3ATAT1GAGA2CG1GA6CG2AC2CATAAGCGTG1GCGAGAGA3TC1TC2CA3TA1-G-T-G3ACTA5AC4AC16TA9GTAG6GA34AT3GC52CT1GA2AG2C-A-2A-A-A-T-G-G-T-G-G-C-G-A-G-A-A-T-G-G-G-A-C-C-C-A-G-A-T-T-G-G-C-G-A-G-4TA1AT2CG22GA32CT23GA9AG19AG32AGAGCG1TA1CA53GC8AG19TA21AG12CT7AG17AG32AG5TC34GA15AG39AG32AT8AC1AG6GAGAGTAC3TC18GC9GA7TC3GAAG7TC2AT11CG7GA5AG32GA12GA1CT15GA10CT18AT22TC2AG26GA11AG20CT11AG2CT7GA7GA2TC31CA33GAGTATTCCG14TC3AG5CT6AGTA3CT8TC4TG14TA26CT1GA37GA26GA38TC5TC5TC1TC3TC3TG7GT5AG9AG9CT1AG5AG2AGTC12CTTCTGAC10CG3GA14AG6GACT23GT9-G-T-A-G-T-G3GTGT6GCTC1GA12AG6GA3AG1T-A-A-G-C-C-A-G-A-A-G-A-13AG2GA7GA15TC4GA3TC4CA3CA18TC6TC7AC2TGAT2TC20AG11CT10GC6AG28GC4CG7CT42TC9AG3GA21GA1TCCT16TCCT35AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,635,1,634,9085,9718,0.0,758,91.969,584,plus,14TC9AG3GA21GA1TCCT16TCCT35AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,637,9075,9710,1,636,0.0,749,91.366,582,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-11 OQ092464,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9556,8890,8917,592,9460,1,8890,0.0,10536,91.533,8162,plus,18TA2CT45T-TC11GTGAAG42CT27-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-T-T46GA34GA35AG10AG28GA20GT5AG6AG17TC13GA3GT5CA30AT13AGCT24CA2TG8CT5GA47AG19AG11AG2GA34AC22GAGC2AC31AG2AG13CG3CT1GA27GACT10AG5CT21CT4CT23TC17AC29TC5GA17GA5TCGC16AG5AT11CT5AT5TA7CA16GCGA11AGTC2TC6AG7AG23AC5GA7AC2AC1AC5AG1GA12AGCT7CT9GA6AG5GA2AC1CTCT25AT6TC6GCCTCT2AG14GA6AGAG12AC2AC2AG5CT1AC6AG5AC5CT5TCAT10AT2AG2AC4CGAGGC2AT4AT6AC3TC3ACGC1ATTG3AC16GA7AG14AT2AG12GATC5CG1CG3G-T-A-1CTAG12GA1GA1CT2-C7A-9AGGA1CT6GA5CT2CT14GA2TC5TC14TC5GA4GA21AG8CT11TC8GA22AGGA2CT17GA5AC8TC11AG9AT34AG15TC25AG3AC10AG10GA20CACA1CA6AG9GA3GA2AG1TC51GA1CA3AG7GA47GA10CA1GC3CTTC1GA4AC2CT8TC2AG4TC18AG35AG11TC2CT11TC102GA7CT23GA32TC29AG38AG10GA117AG2CA116TC100GA16AG8TC1AG14GA1AG42TC17AT59TC23GA5GA29CT16AG12AG17GA11AG3AG11AGGA24GA8AG39AT15TC22GT55AG10TC3AG11TA23GA15AG30CT6GA4GA1CT1AG8AG1GA3AG19CT81GA23GA17TG8CT5GA6TATA22AG22CTTC4AG2TG24TC10TC3CT20TG4AG20AC20TC37AG12AG17CA2GA2AC2CTCT73GA2AGGA34CG2TA27GT13CT15GA37CT3TC7GA44AG62TC35GA15CA53GA15CATC2AG14CT60GA16AG50GA8AG13AT3CT44GA2GA42TC20CA37CT26TG144GA8AC18AG5AG15AG1GAGAAT11GA11CA2TC26TA8GA11GT5GA3AG3CT3AT68GA1AG16GA9GA1TC19TC8CT46AG9TA5CG54GA8AG39AG34AC3CT53GA23CT8GA11CTAG7GA17AT5AG53TC7TA9GA4GA18CT1TC2AG2GA35TC13GA2TC5AG17TC6TACATA2TC2TC5GACA86GA6CA3CT16CT12GA9GT13ACCT7CA3GTCT23CT1AGTC22TA1TC5AG2CA23AG5GA1AG18TG38TC2GA5TC2AG8A-T-C-A-G-C-3TG5GA9TGGA27GA4AG5AC3TC15TC8AG18AT1TC5TCCT21AGAC3TGAT3TC23TC26CT8AG3GA9GA12GA21GA10AT2GA8GA26TC41GA13AGTG4ACCT2CT5TGATCTCG1CA1AGGC3C-A-A-8CA5CGC-A-C-T-A-C-3TA1GTCA1GA4AG1GA10GA1G-A-G-2AG18AG5AT8AG2GA5GA19CT10CT4AG11GA9AG3TA2TC4GCGATC6GA24GA23GA21GA17AC13CT8GA15TC16CT25GA51GAGA4AG20AGGA25TG9TA17AGTA25AG6CA1AC5CTCTAT11TG13CACA24CT7ACAC6AG3GA6AG1TA9GA1CA1AG4TG3AC3GA3AG11GAGAGA-A-A-T-C-A-A5GA7TC3TCAGCA2AT22GA2GA1AGACCT5AG3TC1AG15TC18AC1AG4TA8CA1TA4TG-C-A-G4CA2GA1TGAG-C-A-C6GTGA2GA1ATAG2TACGAT3GAACCT5CT1CA24GA12CATG39TC1GC4TGACCA4AG5CT9CT9CT2AT16G-A-A-A-9AG1CAAT1CTAG-T26AG55AG9AG55-A-A-C10GA52AG14GA7TA34CT25GA59GA29GA2AG26TC24GA22GA2ATCG1GA6GA1TC15GC1AG7GA19AG2TG9CA10AG2TG38GC4AG4ACAG24GA10GA17AG26GA29TC7CT36TC7AG11CA18AC1AG32GAAG9GAGT1CACG6GAAG1CT9AG4TC7TACA5GA53AG6AG32CGTC12GC34AG10AG4CT17CT17GA18GA2TG6GT1GACT1GT1GT6TA17AC22GA7TA13TC11GAAT4TCGA3TG3AG3CA5AG20GA-C-T-G-A-G-C-C-A-G-C-A-A30CT10CT19CT23CT8TC26TG5GA5TC2TC8GA32GA6GT50CT7AG11TG21CA10CA27CACA15GA14TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GA9TC5GA7AGTC3AG1GA3CA19CT5GA16CT8AT10GA20 OQ092464,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9556,8890,380,6,385,8511,8890,4.64e-128,456,91.842,349,plus,14CT7AG11TG21CA10CA27CACA15GA14TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GA9TC5GA7AGTC3AG1GA3CA19CT5GA16CT8AT10GA20 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,9751,61,9718,1,9719,0.0,11550,91.734,8945,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA5CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA185TC5AG6TGAGGA8AG45-G-A-G-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T13TA72ACAG27AG5AG3CA4CT12CA49TGCT4GA11GC30GT1TC21TC48AG7GA25GC2AG18CA17G-4-ATA18AC4AC1GACT33CA23CG1TCTA35AG28AG12AT53AG1AG2TG38TC27TG13GT9GA13AG43AC28CA25TA2CT17TC5GA30GATC3TC8TC4AG54GA14ATAT7AG5GA17TC3CT13AG2TC29AG8AG38GA2GA5AC5CT2AG42-G-C-T2TCGA28TC10CTAT32TC1TC3AC20AG26AG5GA60CT7GA25AG38TC5AT16TC12GA28GA9AGAG34AG11GA50TA4AG3AG7AG21AG45GA91CT2TC20TC8AG101AG14AG50TC14TC17GA65GA5TC35AG14CA9AG11AG16CT22CT92GAGA2AC5AG59GA20AG23AG19AG100AGAT15TC20CA14AG26TCGC4AG32GA5TC18GA12CA30GA17GA24AT1GA6CT11CA17AG1TC26AG26GA35GA30GA3TC27CT12TC1AG2TC8AG26CG26TG11CT17AG20AG26TC23TC2AG2AG4GA2CT3CA18GA16GA6CA7AT11CT44AG20GA18CT26AC1GA19GA24GA14CT63TG13GAAG20AGCA15TA7GA3CT5CT39AG2AG54CT18CT29GA15AG61GA8AG11CT5CT6CT22GA3GA7AT2TC18AG5GA6AG21GA17TA29CAAG40AG8GT99AG40GA8CT42GA1CT26TC68GA14AG69CA20AGCT4CT3AGAG8AG7GT10CT12AC1CT26TC5GA8AT8AG6GA40CT30GA6AG5TG18CA24CT4TC5TC11GC14TG3AT2GT6GATCTA11CAAG13AG28GA13TC12GA10GT23GC4TC39AG15TC1TC5GA23AG7GA27AT9AGAG6AG3TC1CT7CA19AG13TCTA31TC2-T12AG4AG16AG22GA57GA3CG46CT10AC52CG3CA3AG6GC13ATGT30TC6CTTA2GCTC4TG26GACT22AT7GATA1AC32GA5TC2CGAT5AG5AC3GT39T-C-A-G-G-2GT1A-T-T-G-2GA18C-A-C-C-A-T-5AG21AG22AC4CA16TC23AG15TC14AG16CTCA7GA41TC15CGCT5AT21TC12AG25CT24TC36TG6TG6AG2GT1-G-A-A5TA5CA2AC5AG6TCAG1T-3GA1ATCG1GT-A6GATA6AG23TCGACG6AC4AG1AGAG4AG1AGAC14CT5AT3GA7GA2GA10GTGA6AC3AC7TA5TC2AG6TC10CT22AT7AG41AT12GA4AG1AC23ACCA34AG9GA23TC18AG5GA9ATAC9AG31TC1AC1AT2AG15TC12TC14TA2-C-C-G-T3TCTATG1-G1-G4GA3CAAG4AT2TGAT1GA3CT2AG1GA1C-A-T-12AG23GT3AGAC1GA1CA3GA4ACGA5GA5GA3TC1GACGAC18-G-G-A2GT12GA7TG14AG16TC3TC13CG21CTAT5AC1GA18ATA-T-G-6AGCT3CT3AG1-A-C-T-G-A-A-G-G-G-T-C-A4CATC5TAAGAGTA2-T-G-A3CA5TC5GA25GTAG6GA22TC10AGAT2GA7AG22TC1AGTC20GATACTCA2GAA-G-G-4CT1CACGCT1TC8TC26TC44GA11GA32AG4GA12AGAGCGGACA1GA6AT46GC26GA36CT29AC44GA20TC2CA16AG44AG9AG20TC5AC10ATAC3TC18GC1AG21GCATCT4TC2AT43GA14GA5GA24GA10CT18AT7CA14TCAT1AG5GT15AG4GA41GA2AG2CT7GA1TC5GA1TC11AC16CT37GAGTGT1AG14TC3TG2GA14CT4AG23GA28GA24AG12GA26GA5CT20GT11TC5TC11TC45AG2AGTC1GT12TG6CA23AG6GACT32TA5CG2GA11GA2AG26C-C-A-G-C-T-11ATGA23TC17CA6CG3TC13ACTC20GA17AG8GT10GC33AG1GC4AG1GA6GA41TC6CA2AG9AT15GA30GA9TC15AGCTTC9TC1AG16TA25-A-A-G-A-T-A1-A-A-G-A-G-G-C-C-A-A-T-A10TC1GC1TA1TC3CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2TC2-G16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,636,59,675,9084,9719,0.0,705,88.994,566,plus,16TC6CA2AG9AT15GA30GA9TC15AGCTTC9TC1AG16TA23-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G-C-C-A2GA10TC1GC1TA5CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,636,9104,9720,1,636,0.0,699,88.836,565,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA1TC3CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA168 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,9750,61,9718,1,9718,0.0,11560,91.764,8947,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA5CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA185TC5AG6TGAGGA8AG45-G-A-G-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T13TA72ACAG27AG5AG3CA4CT12CA49TGCT4GA11GC30GT1TC21TC48AG7GA25GC2AG18CA17G-4-ATA18AC4AC1GACT33CA23CG1TCTA35AG28AG12AT53AG1AG2TG38TC27TG13GT9GA13AG43AC28CA25TA2CT17TC5GA30GATC3TC8TC4AG54GA14ATAT7AG5GA17TC3CT13AG2TC29AG8AG38GA2GA5AC5CT2AG42-G-C-T2TCGA28TC10CTAT32TC1TC3AC20AG26AG5GA60CT7GA25AG38TC5AT16TC12GA28GA9AGAG34AG11GA50TA4AG3AG7AG21AG45GA91CT2TC20TC8AG101AG14AG50TC14TC17GA65GA5TC35AG14CA9AG11AG16CT22CT92GAGA2AC5AG59GA20AG23AG19AG100AGAT15TC20CA14AG26TCGC4AG32GA5TC18GA12CA30GA17GA24AT1GA6CT11CA17AG1TC26AG26GA35GA30GA3TC27CT12TC1AG2TC8AG26CG26TG11CT17AG20AG26TC23TC2AG2AG4GA2CT3CA18GA16GA6CA7AT11CT44AG20GA18CT26AC1GA19GA24GA14CT63TG13GAAG20AGCA15TA7GA3CT5CT39AG2AG54CT18CT29GA15AG61GA8AG11CT5CT6CT22GA3GA7AT2TC18AG5GA6AG21GA17TA29CAAG40AG8GT99AG40GA8CT42GA1CT26TC68GA14AG69CA20AGCT4CT3AGAG8AG7GT10CT12AC1CT26TC5GA8AT8AG6GA40CT30GA6AG5TG18CA24CT4TC5TC11GC14TG3AT2GT6GATCTA11CAAG13AG28GA13TC12GA10GT23GC4TC39AG15TC1TC5GA23AG7GA27AT9AGAG6AG3TC1CT7CA19AG13TCTA31TC14AG4AG16AG22GA57GA3CG46CT10AC52CG3CA3AG6GC13ATGT37CTTA2GCTC4TG26GACT22AT7GATA1AC32GA5TC2CGAT5AG5AC3GT39T-C-A-G-G-2GT1A-T-T-G-2GA18C-A-C-C-A-T-5AG21AG22AC4CA16TC23AG15TC14AG16CTCA7GA41TC15CGCT5AT21TC12AG25CT24TC36TG6TG6AG2GT1-G-A-A5TA5CA2AC5AG6TCAG1T-3GA1ATCG1GT-A6GATA6AG23TCGACG6AC4AG1AGAG4AG1AGAC14CT5AT3GA7GA2GA10GTGA6AC3AC7TA5TC2AG6TC10CT22AT7AG41AT12GA4AG1AC23ACCA34AG9GA23TC18AG5GA9ATAC9AG31TC1AC1AT2AG15TC12TC14TA2-C-C-G-T3TCTATG1-G1-G4GA3CAAG4AT2TGAT1GA3CT2AG1GA1C-A-T-12AG23GT3AGAC1GA1CA3GA4ACGA5GA5GA3TC1GACGAC18-G-G-A2GT12GA7TG14AG16TC3TC13CG21CTAT5AC1GA18ATA-T-G-6AGCT3CT3AG1-A-C-T-G-A-A-G-G-G-T-C-A4CATC5TAAGAGTA2-T-G-A3CA5TC5GA25GTAG6GA22TC10AGAT2GA7AG22TC1AGTC20GATACTCA2GAA-G-G-4CT1CACGCT1TC8TC26TC44GA11GA32AG4GA12AGAGCGGACA1GA6AT46GC26GA36CT29AC44GA20TC2CA16AG44AG9AG20TC5AC10ATAC3TC18GC1AG21GCATCT4TC2AT43GA14GA5GA24GA10CT18AT7CA14TCAT1AG5GT15AG4GA41GA2AG2CT7GA1TC5GA1TC11AC17AC36GAGTGT1AG14TC3TG2GA14CT4AG23GA28GA24AG12GA26GA5CT20GT11TC5TC11TC45AG2AGTC1GT12TG6CA23AG6GACT32TA5CG2GA11GA2AG26C-C-A-G-C-T-11ATGA23TC17CA6CG3TC13ACTC20GA17AG8GT10GC33AG1GC4AG1GA6GA41TC6CA2AG9AT15GA40TC15AGCTTC9TC1AG16TA25-A-A-G-A-T-A1-A-A-G-A-G-G-C-C-A-A-T-A10TC1GC1TA1TC3CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2TC2-G16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,636,59,675,9083,9718,0.0,708,89.151,567,plus,16TC6CA2AG9AT15GA40TC15AGCTTC9TC1AG16TA23-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G-C-C-A2GA10TC1GC1TA5CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,636,9104,9720,1,636,0.0,699,88.836,565,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA1TC3CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA168 diff --git a/tests/expected-results-large-csv/errors.csv b/tests/expected-results-large-csv/errors.csv index 9c9b3a6..4177f70 100644 --- a/tests/expected-results-large-csv/errors.csv +++ b/tests/expected-results-large-csv/errors.csv @@ -1,179 +1,124 @@ sequence_name,error,message KX505501.1,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 2721" -KX505501.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6323 +KX505501.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6322 KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" -KX505501.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 195 positions. -KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893 -KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5969-6047 contains an internal stop codon at 6005 -KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 40 positions. -KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 96" -KX505501.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1116" +KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" +KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 +KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004 +KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions. +KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions. +KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" +KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" KX505501.1,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. KX505501.1,LongDeletion,Query sequence contains a long deletion. KX505501.1,Scramble,Sequence is plus-scrambled. -MN691959,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN691959,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" +MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123 +MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 MN692074,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 981" -MN692074,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6551 +MN692074,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" -MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5843 can have maximum insertions 90, got 261" -MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893 -MN692074,InsertionInOrf,"Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 108" -MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 76 positions. -MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 204" -MN692074,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1131" +MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" +MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 +MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" +MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions. +MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" +MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" MN692074,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. MN692074,LongDeletion,Query sequence contains a long deletion. -MN692145,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN692145,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" MN090335,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 -MN090335,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MN090335,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 282" +MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 MN090335,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 42 deletions with max tolerance of 10 deletions. MN090335,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, AT." MN090335,Scramble,Sequence is minus-scrambled. MN090335,InternalInversion,Sequence contains an internal inversion. MN090376,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 -MN090376,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN090376,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 252" MN090376,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 95 deletions with max tolerance of 10 deletions. MN090376,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MN090376,Scramble,Sequence is minus-scrambled. MN090376,InternalInversion,Sequence contains an internal inversion. -MK115581.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115581.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115690.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115690.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" MK115690.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 12 deletions with max tolerance of 10 deletions. MK115690.1,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, G-." -MK115571.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115571.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" +MK115690.1,Scramble,Sequence is plus-scrambled. MK115571.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 79 deletions with max tolerance of 10 deletions. MK115571.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK115514.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115514.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" MK115514.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK115488.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115488.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" MK115488.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK115030.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115030.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" MK115030.1,Scramble,Sequence is minus-scrambled. MK115030.1,InternalInversion,Sequence contains an internal inversion. -MK115498.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115498.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115211.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6890 -MK115211.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115211.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 252" +MK115211.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6889 MK115211.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 20 deletions with max tolerance of 10 deletions. MK115211.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115211.1,Scramble,Sequence is minus-scrambled. MK115211.1,InternalInversion,Sequence contains an internal inversion. MK115158.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 20 deletions with max tolerance of 10 deletions. MK115158.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK114705.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 74 positions. -MK114705.1,FrameshiftInOrf,Smaller ORF nef at 8796-9417 contains out of frame indels that impact 122 positions. +MK114705.1,DeletionInOrf,"Smaller ORF nef at 8795-9416 can have maximum deletions 30, got 186" MK114856.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 873 MK114856.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2213 -MK114856.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6326 +MK114856.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6325 MK114856.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5172 -MK114856.1,InternalStopInOrf,Smaller ORF vpr at 5558-5843 contains an internal stop codon at 5594 -MK114856.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5920 -MK114856.1,FrameshiftInOrf,Smaller ORF vpu at 6259-6310 contains out of frame indels that impact 67 positions. -MK114856.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434 -MK114856.1,InternalStopInOrf,Smaller ORF nef at 8796-9417 contains an internal stop codon at 8853 -MK114856.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.399685326687554e-65). +MK114856.1,InternalStopInOrf,Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5594 +MK114856.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5919 +MK114856.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 +MK114856.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 +MK114856.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 +MK114856.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8852 +MK114856.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 3.639064030015132e-65). MK115009.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 834 MK115009.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115009.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6350 +MK115009.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6349 MK115009.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5373 -MK115009.1,DeletionInOrf,"Smaller ORF vpr at 5558-5843 can have maximum deletions 30, got 75" -MK115009.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5860 -MK115009.1,InsertionInOrf,"Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 177" -MK115009.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434 -MK115009.1,InternalStopInOrf,Smaller ORF nef at 8796-9417 contains an internal stop codon at 8874 -MK115009.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 1.3731449337509935e-41). +MK115009.1,InternalStopInOrf,Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5717 +MK115009.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859 +MK115009.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 +MK115009.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115009.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 1.2040967664149076e-41). MK115009.1,Scramble,Sequence is minus-scrambled. MK115009.1,InternalInversion,Sequence contains an internal inversion. -MK115387.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115387.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 279" -MK115491.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115491.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" +MK115387.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 MK116110.1,InternalStopInOrf,ORF gag at 140-1643 contains an internal stop codon at 185 MK116110.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 22 deletions with max tolerance of 10 deletions. MK116110.1,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, CC." -MK115527.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115527.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK114997.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6512 -MK114997.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK114997.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" -MK115518.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115518.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115065.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115065.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" +MK114997.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6511 MK115065.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 75 deletions with max tolerance of 10 deletions. MK115065.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115065.1,Scramble,Sequence is plus-scrambled. MK115065.1,InternalInversion,Sequence contains an internal inversion. MK115464.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 924 MK115464.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115464.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6425 +MK115464.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6424 MK115464.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5247 -MK115464.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115464.1,FrameshiftInOrf,Smaller ORF tat_exon1 at 5830-6046 contains out of frame indels that impact 104 positions. -MK115464.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434 -MK115464.1,FrameshiftInOrf,Smaller ORF nef at 8796-9417 contains out of frame indels that impact 393 positions. -MK115464.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 5.391006513622446e-23). -MK115530.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115530.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" +MK115464.1,FrameshiftInOrf,Smaller ORF tat_exon1 at 5829-6045 contains out of frame indels that impact 104 positions. +MK115464.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 +MK115464.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 +MK115464.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 +MK115464.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115464.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.937891251407691e-23). MK115520.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2198 -MK115520.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115520.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" MK115520.1,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, GA." MK115520.1,InternalInversion,Sequence contains an internal inversion. -MK115503.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115503.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115570.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115570.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" MK115570.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 11 deletions with max tolerance of 10 deletions. MK115570.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK115509.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115509.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115702.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 74 positions. -MK115702.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" MK115702.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 54 deletions with max tolerance of 10 deletions. MK115702.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115702.1,Scramble,Sequence is plus-scrambled. MK115702.1,InternalInversion,Sequence contains an internal inversion. MK115095.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 927 MK115095.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115095.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6551 +MK115095.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 MK115095.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5151 -MK115095.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MK115095.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5860 -MK115095.1,FrameshiftInOrf,Smaller ORF vpu at 6259-6310 contains out of frame indels that impact 43 positions. -MK115095.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434 -MK115095.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 213" -MK115095.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 9.460464921885922e-40). -MK115490.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115490.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -MK115576.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MK115576.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" -OQ092466,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -OQ092466,InsertionInOrf,"Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 195" -OQ092466,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 261" +MK115095.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859 +MK115095.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 +MK115095.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 +MK115095.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115095.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 8.33506116803153e-40). OQ092466,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, GC." OQ092463,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 26 deletions with max tolerance of 10 deletions. OQ092463,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." OQ092465,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, GA." -OQ092462,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -OQ092462,InsertionInOrf,"Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 195" -OQ092462,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 255" OQ092462,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 23 deletions with max tolerance of 10 deletions. OQ092462,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." OQ092464,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 19 deletions with max tolerance of 10 deletions. OQ092464,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -OQ092467,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -OQ092467,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 237" OQ092467,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 22 deletions with max tolerance of 10 deletions. OQ092467,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." diff --git a/tests/expected-results-large-csv/holistic.csv b/tests/expected-results-large-csv/holistic.csv index fc0954a..86f159e 100644 --- a/tests/expected-results-large-csv/holistic.csv +++ b/tests/expected-results-large-csv/holistic.csv @@ -1,42 +1,42 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498199403230785,1.2158237356034052,0.17661753684736448,789,8795,4 -MN691959,9493,0.19593905853945925,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0816956477003807,1.1086063415148004,1.0,789,8795,3 -MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5041670953801831,1.1728099569171853,0.41144141893579816,789,8795,4 -MN692145,9689,0.1661041079701131,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.1304660973351168,1.1271545051088863,1.0,789,8795,3 -MN090335,9069,0.1754017863888554,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842576396748637,1.0603153600176425,1.0003747189607795,789,8795,3 -MN090376,8985,0.026007919521734202,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,8985,0.9784957300133759,1.0604340567612687,0.9943792155883088,789,8795,3 -MK115581.1,9495,0.6897199265079494,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9495,0.9870357032616525,1.0046340179041602,1.0,789,8795,2 -MK115690.1,9689,0.05065930954004094,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,0.988167506945159,0.9949427185468056,1.0,789,8795,2 -MK115571.1,9394,0.8012585672082311,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9394,0.9866241382858318,1.0113902490951672,1.0,789,8795,2 -MK115514.1,9382,0.6458974386368621,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9382,0.9864183557979216,1.0173736943082499,1.0,789,8795,2 -MK115488.1,9623,0.6511896911074662,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9623,1.0255170285008746,1.0325262392185388,1.0,789,8795,6 -MK115030.1,9126,0.031598631869680704,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9126,0.9940323078506019,1.0655270655270654,1.0,789,8795,3 -MK115498.1,9461,0.8339748776671196,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9461,0.9866241382858318,1.0080329774865235,1.0,789,8795,2 -MK115211.1,9032,0.11689558806708,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9032,0.9950612202901533,1.0598981399468557,1.0,789,8795,3 +KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17663960024984385,789,8794,4 +MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8794,3 +MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.4114928169893816,789,8794,4 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 +MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.0003747657713928,789,8794,3 +MN090376,8985,0.026415767987601813,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,8985,0.9784935171846059,1.0604340567612687,0.9943785134291068,789,8794,3 +MK115581.1,9495,0.6919440876652894,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9495,0.987034369211772,1.0046340179041602,1.0,789,8794,2 +MK115690.1,9689,0.051230576250981485,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.004630582424367,1.0113530808132933,1.0,789,8794,3 +MK115571.1,9394,0.8029570594372466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9394,0.9866227618851615,1.0113902490951672,1.0,789,8794,2 +MK115514.1,9382,0.6482462132632603,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9382,0.9864169582218564,1.0173736943082499,1.0,789,8794,2 +MK115488.1,9623,0.6534999185838631,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9623,1.0255196542498457,1.0325262392185388,1.0,789,8794,6 +MK115030.1,9126,0.032014462397289556,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9126,0.994031693764149,1.0655270655270654,1.0,789,8794,3 +MK115498.1,9461,0.83547963060225,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9461,0.9866227618851615,1.0080329774865235,1.0,789,8794,2 +MK115211.1,9032,0.11818291879607423,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9032,0.995060712080675,1.0598981399468557,1.0,789,8794,3 MK115158.1,9143,0.002572269807584293,Ref.47_BF.ES.08.P1942.GQ372987,9143,0.9921577414295317,0.9699223449633599,1.0,234,8212,1 -MK114705.1,9411,0.14449377496074622,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9411,1.0980553554892478,1.122622463075125,1.0,789,8795,6 -MK114856.1,9477,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9477,1.0485646671468258,1.0812493405085997,1.0,789,8795,4 -MK115009.1,9207,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9207,0.9965016977055252,1.0590854784403172,1.0,789,8795,3 -MK115387.1,9136,0.5412311092694289,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9136,0.9796275336968824,1.040936952714536,1.0,789,8795,2 -MK115491.1,9422,0.8951015182445495,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9422,1.003704084782385,1.0299299511780937,1.0,789,8795,2 +MK114705.1,9411,0.14584270737492833,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9411,1.098065445564931,1.122622463075125,1.0,789,8794,6 +MK114856.1,9477,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9477,1.0485696645400289,1.0812493405085997,1.0,789,8794,4 +MK115009.1,9207,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9207,0.9965013377238114,1.0590854784403172,1.0,789,8794,3 +MK115387.1,9136,0.5436355526687852,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9136,0.9796254373327845,1.040936952714536,1.0,789,8794,2 +MK115491.1,9422,0.8961809048805741,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9422,1.0037044659394938,1.0299299511780937,1.0,789,8794,2 MK116110.1,8967,0.07021438897893317,Ref.B.TH.90.BK132.AY173951,8967,0.9957759004001778,0.9972119995539199,0.998622244488978,140,8124,3 -MK115527.1,9481,0.7689834393883834,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9481,0.986727029529787,1.0056956017297753,1.0,789,8795,2 -MK114997.1,9055,0.054959132555391754,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9055,0.9784957300133759,1.0516841524019878,1.0,789,8795,2 -MK115518.1,9537,0.6385326595592609,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9537,0.9847720958946393,0.9996854356715948,1.0,789,8795,3 -MK115065.1,9214,0.033517722768753644,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9214,1.0080255170285009,1.069459518124593,1.0,789,8795,6 -MK115464.1,9663,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9663,0.9838460746990431,0.9893407844354756,1.0,789,8795,2 -MK115530.1,9544,0.5789377103398377,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9544,0.9866241382858318,0.9992665549036044,1.0,789,8795,2 -MK115520.1,9589,0.5200353682902832,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9589,0.9787015125012861,0.987902805297737,1.012115913065201,789,8795,3 -MK115503.1,9617,0.4263025132504157,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9617,0.9870357032616525,0.9953207861079338,1.0,789,8795,2 -MK115570.1,9485,0.738578434638724,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9485,0.9866241382858318,1.0057986294148655,1.0,789,8795,2 -MK115509.1,9353,0.7866198309713798,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9353,0.9866241382858318,1.0197797498128942,1.0,789,8795,2 -MK115702.1,9098,0.14401391767451666,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9098,0.987447268237473,1.0596834469114091,1.019860104921309,789,8795,4 -MK115095.1,9137,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9137,0.9907397880440375,1.060085367188355,1.0,789,8795,2 -MK115490.1,9347,0.8863248655310947,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9347,0.9848749871385946,1.0204343639670483,1.0,789,8795,3 -MK115576.1,9266,0.818189227062389,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9266,0.9917687004835889,1.0342110943233327,1.0,789,8795,3 -OQ092466,9686,0.3876036547663967,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9686,1.1015536577837226,1.1192442700805285,1.0,789,8795,3 +MK115527.1,9481,0.770862998910788,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9481,0.9867256637168141,1.0056956017297753,1.0,789,8794,2 +MK114997.1,9055,0.05560625344150194,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9055,0.9784935171846059,1.0516841524019878,1.0,789,8794,2 +MK115518.1,9537,0.6408152618300496,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9537,0.9847705289154147,0.9996854356715948,1.0,789,8794,3 +MK115065.1,9214,0.033954952452739495,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9214,1.0080263428689031,1.069459518124593,1.0,789,8794,6 +MK115464.1,9663,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9663,0.9838444124305412,0.9893407844354756,1.0,789,8794,2 +MK115530.1,9544,0.5812621948015355,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9544,0.9866227618851615,0.9992665549036044,1.0,789,8794,2 +MK115520.1,9589,0.5225247969864292,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9589,0.9786993208479111,0.987902805297737,1.0121174266083697,789,8794,3 +MK115503.1,9617,0.42870398270204335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9617,0.987034369211772,0.9953207861079338,1.0,789,8794,2 +MK115570.1,9485,0.7406166892211931,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9485,0.9866227618851615,1.0057986294148655,1.0,789,8794,2 +MK115509.1,9353,0.7883768413537747,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9353,0.9866227618851615,1.0197797498128942,1.0,789,8794,2 +MK115702.1,9098,0.1454272422215308,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9098,0.9874459765383824,1.0596834469114091,1.0198625858838226,789,8794,4 +MK115095.1,9137,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9137,0.9907388351512657,1.060085367188355,1.0,789,8794,2 +MK115490.1,9347,0.8875203448314265,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9347,0.9848734307470673,1.0204343639670483,1.0,789,8794,3 +MK115576.1,9266,0.8197662757563093,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9266,0.9917678534677917,1.0342110943233327,1.0,789,8794,3 +OQ092466,9686,0.3858261890626,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9686,1.1015641078411196,1.1192442700805285,1.0,789,8794,3 OQ092463,9605,0.21628713708846803,Ref.B.TH.90.BK132.AY173951,9605,1.0529124055135617,0.9884435190005205,1.0,140,8124,2 OQ092465,9659,0.02412789935966586,Ref.28_BF.BR.99.BREPM12817.DQ085874,9659,1.0429696287964005,0.9620043482762191,1.0,200,8208,2 -OQ092462,9714,0.10777665573070194,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9714,1.130671879823027,1.1301214741610048,1.0,789,8795,3 +OQ092462,9714,0.10883643311676816,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9714,1.1306853261988064,1.1301214741610048,1.0,789,8794,3 OQ092464,9556,0.006887768010151674,Ref.28_BF.BR.99.BREPM12817.DQ085874,9556,1.0427446569178853,0.9678735872750105,1.0,200,8208,2 -OQ092467,9936,0.6416537859942263,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9936,1.1308776623109373,1.0962157809983897,1.0,789,8795,3 +OQ092467,9936,0.6438715160567257,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9936,1.1308911298621116,1.0962157809983897,1.0,789,8794,3 diff --git a/tests/expected-results-large-csv/intact.fasta b/tests/expected-results-large-csv/intact.fasta index e69de29..2d494f4 100644 --- a/tests/expected-results-large-csv/intact.fasta +++ b/tests/expected-results-large-csv/intact.fasta @@ -0,0 +1,1754 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA +>MK115581.1 +AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA +ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA +TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT +AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT +GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG +AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA +GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG +CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG +ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT +TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT +CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG +AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG +TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA +AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA +TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG +CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG +CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC +ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA +GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA +GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC +CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG +TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA +GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA +AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT +TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG +GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA +ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT +GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA +AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG +GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC +CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA +AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA +GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG +AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT +AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG +TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG +AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT +ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA +AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC +AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG +TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG +GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT +ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC +TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT +GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT +AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA +TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA +TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT +TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA +AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG +TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC +ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA +AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA +AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA +TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT +AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA +ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC +CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA +ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG +AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC +CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA +TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC +ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA +GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT +AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC +CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT +ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA +GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT +AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT +TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG +GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC +CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA +AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA +GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA +AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT +ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG +GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC +AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT +TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA +TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT +GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC +CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG +AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG +TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT +CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG +GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA +GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC +AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA +ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA +TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA +ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC +ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG +GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC +AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC +GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG +TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA +TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA +GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG +AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG +TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA +TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG +GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA +GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG +CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA +CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG +GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA +AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT +GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA +AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA +AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA +TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA +GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA +CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT +ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA +CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA +AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC +CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA +CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA +AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA +GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA +CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA +GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA +TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG +GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG +TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC +AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC +AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG +GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT +TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA +GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG +GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT +AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA +GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA +CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC +GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG +GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC +TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC +AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC +TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA +CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG +GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT +AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA +CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC +CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC +TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG +GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA +CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA +TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA +AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA +AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA +GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG +GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC +TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC +CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG +CACTCAAGGCAAGCT +>MK115498.1 +AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC +TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG +GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA +CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT +CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA +ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA +GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA +GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT +CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG +GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA +ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT +AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA +GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA +GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG +GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA +GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC +ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA +ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT +GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT +ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA +GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT +ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG +TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA +ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA +GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA +GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA +GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC +ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA +CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC +CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA +GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC +AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA +TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT +TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT +TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG +GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC +TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC +CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT +TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA +ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT +TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA +TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG +CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA +GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA +AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC +AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG +AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC +TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC +TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG +TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA +TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC +CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG +TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA +ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT +ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA +AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC +AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT +GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA +TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA +AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA +ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA +ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG +AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG +CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA +CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA +AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA +AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG +TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC +TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG +GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC +ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG +GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA +TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA +CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT +ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC +AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC +TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA +ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC +AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT +TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC +TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA +TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG +GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA +GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC +ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC +TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA +CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC +AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG +TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG +GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC +ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA +ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT +CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA +AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA +GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT +CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG +ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT +GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA +TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC +TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC +CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC +CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC +AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA +TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA +TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA +AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA +ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC +ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC +AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA +GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA +GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT +TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT +ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG +AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT +TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA +TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA +TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC +TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG +CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC +CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG +TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG +GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC +CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT +CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT +ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT +TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG +AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC +TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT +GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC +AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA +ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT +GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT +TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC +CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA +AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA +CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC +AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT +CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC +CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC +TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG +GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC +GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG +CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG +AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT +TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA +TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT +TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT +GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT +TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA +AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA +AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG +GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC +GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT +AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115491.1 +CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT +TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG +ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC +TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG +GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC +GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA +GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG +CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA +TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA +AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA +ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT +CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT +GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG +AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA +ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC +TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG +AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA +TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG +AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC +AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA +TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA +TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC +AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG +AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA +ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA +TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA +TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA +AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC +CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG +AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT +TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG +AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT +CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA +AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG +AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA +TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC +ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC +CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT +TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT +GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT +TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA +TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA +AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA +TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG +GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA +AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA +TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA +AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA +TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT +ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT +GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA +ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT +AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC +ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT +TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA +CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT +AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG +GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC +CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA +TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG +AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC +AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA +TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT +AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG +AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT +TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC +AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA +TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG +GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG +TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT +CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT +CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT +TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT +TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT +CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT +AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA +AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT +TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC +AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT +GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG +TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA +TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG +GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA +AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT +ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC +CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA +AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG +AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG +GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG +GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA +GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA +TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC +TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA +AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG +GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT +CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG +GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA +GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA +AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG +GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA +GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT +GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA +GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA +AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG +CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT +AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC +AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT +GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA +GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC +CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT +AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA +CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC +AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC +AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA +GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT +ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT +AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA +TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG +AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC +AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT +TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG +ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT +AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG +CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA +GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT +GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG +CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC +CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT +GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG +ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT +GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG +GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA +ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT +AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA +CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT +CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC +CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA +CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG +CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA +GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA +ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG +TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG +GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC +AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT +TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG +CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA +TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC +ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT +GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA +TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT +TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT +CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG +GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT +CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA +GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC +GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG +TA +>MK115527.1 +ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC +GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA +CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT +AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG +CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA +GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA +ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC +ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT +GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT +AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA +GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC +TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT +TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC +ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA +CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG +AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC +AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA +AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC +CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA +ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT +CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG +GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG +ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG +GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA +ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA +TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT +TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG +TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA +TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG +TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG +CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA +ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT +GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT +TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG +AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC +AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG +GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC +AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT +GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT +CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG +AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC +TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC +AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT +TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA +CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT +TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC +AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA +TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA +TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT +CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT +GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA +ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT +CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC +AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC +AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA +AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG +GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC +AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA +AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA +ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC +TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA +AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA +CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA +TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT +CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA +GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA +AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA +AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA +AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA +GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA +TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG +AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA +TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA +AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG +ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA +GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG +TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA +TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG +AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA +CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA +CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG +GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT +CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA +GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG +GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA +TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA +GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC +AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG +AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG +CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA +AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC +ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA +GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA +ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT +GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT +GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC +CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT +GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC +AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA +TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA +AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA +GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG +ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT +GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA +GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA +GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG +ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC +CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT +GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA +AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT +AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT +CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT +CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA +CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA +GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA +GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA +AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA +AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT +GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG +GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA +ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT +GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA +AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG +TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA +GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG +CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA +GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA +GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA +AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC +ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC +CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT +AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA +AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG +CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG +TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG +ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT +TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA +ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC +TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA +GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC +CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT +AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA +GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA +AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC +TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG +AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG +CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT +GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA +GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT +CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG +ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA +TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA +AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA +GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG +CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA +TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG +AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC +T +>MK115518.1 +TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG +CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT +AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG +CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG +CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC +CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT +AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC +CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT +CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC +GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA +TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT +AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC +AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA +ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT +ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA +GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT +AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC +ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC +ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA +TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG +ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG +TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC +ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT +AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG +AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA +AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT +AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG +GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA +TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG +TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA +ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG +GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC +AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA +GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG +CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA +GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA +GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT +GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA +AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA +CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA +GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA +AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT +ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG +GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA +CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT +GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG +CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA +GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT +GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT +CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT +TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA +AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT +CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA +CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA +ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA +GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT +CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA +ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA +TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC +ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA +TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA +GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC +CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT +TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA +CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG +GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA +GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC +CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA +CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG +GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA +GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT +ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG +CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC +GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA +GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG +GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA +GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA +CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG +GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA +GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT +AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT +TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG +GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC +ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA +ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT +TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC +TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG +ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG +AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA +GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA +CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT +ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA +CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA +CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG +AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA +AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG +ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT +ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT +AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG +GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA +AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT +TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT +GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG +CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG +GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC +ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC +TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG +AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA +ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG +ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA +AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA +AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT +GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG +AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC +ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA +TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC +AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA +AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC +CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC +AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA +ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG +CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC +TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG +ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT +TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG +GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT +CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA +ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA +AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG +GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT +GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG +AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG +AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA +ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG +GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC +CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG +AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG +CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT +TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA +AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT +TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC +AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG +CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA +AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC +CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC +TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT +TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG +GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC +AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT +CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA +GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA +GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG +CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG +GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT +GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC +TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115530.1 +TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC +GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG +ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC +AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG +CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT +GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG +CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG +CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC +TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT +GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA +AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA +AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG +AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT +CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA +TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA +AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT +ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT +TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT +TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG +GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT +GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA +GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA +ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA +AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC +CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG +AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA +CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG +GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT +CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT +TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT +GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT +TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC +CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT +CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT +TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA +TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA +AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA +AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT +TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA +AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT +GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA +AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA +AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA +CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT +AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA +GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA +CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA +AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA +TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG +ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC +ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT +GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG +GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC +CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA +CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT +AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT +TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA +ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC +TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG +GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG +GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC +TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT +TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT +GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT +TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT +AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA +ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA +TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT +TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA +AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC +ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC +AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG +GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT +TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA +AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG +AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA +AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC +AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA +TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA +AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA +AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA +TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA +AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC +ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG +AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA +CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT +CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC +AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC +CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG +AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT +AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG +ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC +CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT +TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC +ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC +ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA +GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG +CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC +AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG +AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG +GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA +CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC +ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA +GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA +CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA +ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT +AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA +ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA +GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC +TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG +ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA +GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT +TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA +ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG +AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT +ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA +GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA +GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT +ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA +GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA +GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA +GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA +GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT +GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA +GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC +GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG +CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG +GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG +CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT +GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG +GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC +CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT +TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA +TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA +TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA +GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA +TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG +AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA +ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT +ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA +GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG +GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC +TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC +TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA +TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA +GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA +AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG +GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC +CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC +CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC +GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG +AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT +TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC +AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT +CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT +GCCT +>MK115503.1 +GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG +AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG +CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA +ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT +AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG +ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC +AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG +CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT +AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT +AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA +CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA +AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT +AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA +ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC +TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT +TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT +ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA +AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG +CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC +ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT +CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT +AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA +AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT +GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC +ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT +GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG +ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA +AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC +AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC +AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG +CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT +TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG +GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG +ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT +TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC +AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT +CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA +GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA +TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG +ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT +GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT +AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA +CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA +AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT +ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG +AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG +AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA +GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT +AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT +AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA +TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA +GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG +AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG +CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA +AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC +CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA +CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA +AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT +CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT +AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA +TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG +GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA +GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA +GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA +AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT +TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA +TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA +GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT +GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA +GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG +GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA +TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA +CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA +TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG +AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC +AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC +TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA +GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC +CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT +ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT +TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC +TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG +AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA +AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC +AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG +TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT +GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG +GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT +TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG +GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC +ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA +TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA +TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC +CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC +ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC +AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA +GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA +GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG +GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT +ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT +AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA +AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA +CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA +CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT +ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA +AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC +CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA +ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT +GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA +CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA +TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG +TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA +TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG +CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA +ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT +TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG +CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA +ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA +TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT +TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC +ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT +TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG +CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT +GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT +CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT +TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG +TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA +GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA +GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA +TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC +TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC +AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG +TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT +GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA +AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA +GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA +TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG +TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG +ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT +TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT +GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA +GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA +AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA +GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA +GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG +GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG +GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT +ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA +GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC +TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC +CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA +GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG +CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG +ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT +CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC +AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT +GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG +TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT +CAATAAAGCTTGCCTTG +>MK115509.1 +CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT +AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC +TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT +CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC +TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA +TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC +AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG +GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA +TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA +TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG +GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT +AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA +GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA +CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG +CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG +GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA +TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA +GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG +CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC +ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT +ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG +ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC +TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT +TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA +GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA +CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA +ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC +AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT +GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA +ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA +GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG +GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC +CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG +ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG +GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC +ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC +TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG +TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA +AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA +TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA +AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG +TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG +ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT +TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC +CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC +CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG +GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT +TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA +TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG +ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA +TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA +CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT +TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC +AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA +AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG +AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA +GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT +GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG +AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA +CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA +CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG +GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC +CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA +AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA +AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG +AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC +CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA +TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG +GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC +CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG +TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT +GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG +TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG +AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG +GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA +CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA +GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG +TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG +ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA +ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT +TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA +GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG +CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC +CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT +ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT +AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA +AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG +ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA +AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT +ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC +TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA +GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT +CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT +TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA +AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT +GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA +ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA +GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG +GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT +GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA +AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA +TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT +GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA +GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG +TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG +AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA +GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA +TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT +ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG +TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC +ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA +AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT +GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC +TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC +ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT +AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA +AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT +GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT +CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT +GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT +AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT +GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG +AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT +AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT +GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT +GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA +GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT +TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG +TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT +TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA +AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT +AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT +AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT +ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA +AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT +TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT +CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA +TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT +CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG +AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT +GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG +AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG +AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC +TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA +GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC +TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC +TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG +AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG +TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC +CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC +TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT +ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG +AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115490.1 +CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG +GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC +AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA +ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG +GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA +ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA +GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA +AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA +AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA +AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT +AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA +TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC +AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA +GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC +CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA +GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA +GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT +ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA +GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA +GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA +GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT +AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA +GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG +ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA +GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC +CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG +CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA +GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG +GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG +CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA +CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA +AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG +TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA +CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG +GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG +CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA +CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT +TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA +AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC +CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA +GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT +TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG +GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA +TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG +GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA +GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG +ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT +GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT +ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT +GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG +CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG +TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG +AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC +AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG +GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG +TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC +CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC +CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG +AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT +TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA +CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG +AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA +AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT +ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG +TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC +ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG +TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG +GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG +TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG +AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA +CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT +GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG +AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC +TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG +GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG +AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG +ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC +AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG +GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG +AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA +CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT +GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG +GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC +CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA +AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG +GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA +CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG +GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG +AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA +CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT +TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG +CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT +AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC +ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT +CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG +CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT +GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG +TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG +GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG +TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC +AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT +TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA +TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT +AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC +TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT +GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA +GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG +TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT +TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA +TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG +AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT +AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA +ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG +ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG +TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA +ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT +AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA +TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT +CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC +CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG +AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA +CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC +ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC +TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT +GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG +AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA +GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG +TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA +ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA +TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA +ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA +ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT +AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT +TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG +TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG +GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT +TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG +GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT +CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG +TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA +AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA +TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC +ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG +CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA +TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG +GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG +GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT +TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA +ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA +TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT +ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA +GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC +AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT +CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115576.1 +AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT +AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG +CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG +AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC +CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA +GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT +CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG +TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA +GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG +GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT +GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA +CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC +CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA +GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC +ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT +CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC +AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA +AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC +ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA +CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG +GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA +TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT +ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA +AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA +AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG +GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT +GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC +CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC +AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC +TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA +GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT +GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC +TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC +AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT +TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC +AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG +GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA +ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC +CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA +CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC +CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG +AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG +GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC +CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA +CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA +TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG +TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA +GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA +AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT +GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA +AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT +TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG +CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT +ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT +ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG +GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA +GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG +AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA +CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA +CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA +CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT +TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT +CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA +ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC +ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG +TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT +GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA +GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG +GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG +TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT +ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA +GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT +TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA +AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG +CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA +GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA +AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG +CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG +TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG +ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT +ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT +CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA +TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA +TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT +CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA +GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG +GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA +CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA +ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA +GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG +GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT +GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT +CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC +TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC +TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT +CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA +ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA +GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA +AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG +GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG +GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC +ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT +ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT +GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG +CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA +TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG +CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA +TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA +CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA +TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG +ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC +TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT +CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC +AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC +AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG +GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT +AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG +AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG +GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT +TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT +TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA +GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA +TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG +AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG +AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT +ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA +TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA +AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG +CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA +TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC +CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA +TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT +ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT +AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC +GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG +ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG +CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT +TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT +TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA +GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC +TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA +AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG +CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA +ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG +TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG +ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA +GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA +ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG +TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA +GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC +TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT +GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG +GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG +GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC +TGCTTAAGCCTCAATAAAGCTTGCCT diff --git a/tests/expected-results-large-csv/nonintact.fasta b/tests/expected-results-large-csv/nonintact.fasta index 9113fa3..29434e4 100644 --- a/tests/expected-results-large-csv/nonintact.fasta +++ b/tests/expected-results-large-csv/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA @@ -731,166 +568,6 @@ CCGCTAGGGACTTTCCAGGGGAGGCGTGAACTGGGCGGGACAGGGGAGTGGCGAGCCCTC AGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGAT CAGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT GCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC ->MK115581.1 -AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA -ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA -TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT -AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT -GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG -AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA -GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG -CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG -ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT -TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT -CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG -AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG -TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA -AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA -TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG -CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG -CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC -ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA -GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA -GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC -CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG -TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA -GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA -AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT -TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG -GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA -ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT -GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA -AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG -GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC -CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA -AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA -GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG -AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT -AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG -TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG -AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT -ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA -AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC -AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG -TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG -GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT -ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC -TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT -GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT -AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA -TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA -TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT -TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA -AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG -TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC -ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA -AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA -AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA -TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT -AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA -ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC -CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA -ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG -AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC -CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA -TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC -ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA -GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT -AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC -CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT -ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA -GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT -AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT -TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG -GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC -CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA -AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA -GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA -AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT -ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG -GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC -AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT -TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA -TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT -GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC -CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG -AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG -TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT -CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG -GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA -GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC -AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA -ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA -TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA -ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC -ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG -GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC -AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC -GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG -TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA -TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA -GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG -AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG -TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA -TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG -GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA -GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG -CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA -CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG -GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA -AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT -GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA -AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA -AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA -TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA -GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA -CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT -ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA -CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA -AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC -CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA -CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA -AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA -GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA -CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA -GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA -TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG -GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG -TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC -AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC -AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG -GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT -TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA -GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG -GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT -AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA -GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA -CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC -GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG -GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC -TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC -AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC -TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA -CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG -GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT -AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA -CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC -CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC -TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG -GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA -CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA -TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA -AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA -AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA -GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG -GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC -TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC -CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG -CACTCAAGGCAAGCT >MK115690.1 TGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACA CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCAC @@ -1686,165 +1363,6 @@ CCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGAC CAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAA AGCTTGCCTTGCACTCAAGGCAAGCTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC TAGAGA ->MK115498.1 -AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC -TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG -GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA -CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT -CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA -ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA -GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA -GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT -CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG -GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA -ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT -AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA -GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA -GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG -GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA -GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC -ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA -ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT -GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT -ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA -GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT -ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG -TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA -ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA -GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA -GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA -GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC -ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA -CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC -CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA -GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC -AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA -TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT -TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT -TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG -GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC -TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC -CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT -TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA -ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT -TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA -TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG -CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA -GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA -AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC -AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG -AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC -TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC -TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG -TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA -TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC -CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG -TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA -ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT -ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA -AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC -AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT -GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA -TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA -AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA -ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA -ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG -AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG -CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA -CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA -AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA -AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG -TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC -TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG -GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC -ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG -GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA -TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA -CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT -ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC -AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC -TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA -ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC -AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT -TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC -TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA -TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG -GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA -GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC -ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC -TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA -CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC -AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG -TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG -GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC -ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA -ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT -CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA -AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA -GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT -CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG -ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT -GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA -TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC -TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC -CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC -CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC -AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA -TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA -TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA -AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA -ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC -ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC -AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA -GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA -GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT -TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT -ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG -AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT -TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA -TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA -TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC -TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG -CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC -CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG -TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG -GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC -CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT -CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT -ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT -TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG -AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC -TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT -GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC -AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA -ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT -GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT -TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC -CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA -AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA -CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC -AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT -CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC -CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC -TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG -GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC -GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG -CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG -AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT -TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA -TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT -TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT -GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT -TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA -AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA -AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG -GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC -GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT -AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115211.1 CTTCTAGCCTCCGCTAGTCAAAACGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAA GCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCG @@ -2777,165 +2295,6 @@ CATAGAGTTTTCCACCAGGGACTTTCCAGAAGAGGCGTGGCCTGGGCGGGACCGGGGAGT GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGT TAGACCAGATCTGAGCCTGGGAGCTCTCTGTCTAACTAGGGAACCCACTGCTTAAGCCTC AATAAAGCTTGCCTTG ->MK115491.1 -CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT -TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG -ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC -TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG -GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC -GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA -GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG -CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA -TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA -AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA -ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT -CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT -GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG -AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA -ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC -TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG -AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA -TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG -AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC -AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA -TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA -TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC -AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG -AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA -ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA -TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA -TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA -AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC -CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG -AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT -TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG -AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT -CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA -AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG -AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA -TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC -ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC -CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT -TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT -GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT -TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA -TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA -AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA -TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG -GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA -AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA -TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA -AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA -TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT -ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT -GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA -ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT -AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC -ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT -TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA -CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT -AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG -GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC -CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA -TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG -AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC -AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA -TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT -AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG -AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT -TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC -AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA -TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG -GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG -TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT -CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT -CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT -TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT -TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT -CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT -AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA -AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT -TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC -AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT -GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG -TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA -TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG -GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA -AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT -ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC -CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA -AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG -AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG -GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG -GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA -GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA -TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC -TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA -AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG -GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT -CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG -GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA -GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA -AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG -GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA -GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT -GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA -GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA -AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG -CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT -AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC -AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT -GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA -GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC -CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT -AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA -CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC -AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC -AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA -GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT -ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT -AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA -TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG -AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC -AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT -TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG -ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT -AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG -CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA -GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT -GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG -CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC -CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT -GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG -ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT -GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG -GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA -ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT -AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA -CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT -CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC -CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA -CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG -CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA -GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA -ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG -TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG -GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC -AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT -TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG -CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA -TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC -ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT -GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA -TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT -TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT -CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG -GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT -CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA -GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC -GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG -TA >MK116110.1 CCTGAAAGCGAAAGTAGAACCAGAGAAGTTCTCTCGACGCAGGACTCGGCTTGCTGAGCT TTATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCT @@ -3087,166 +2446,6 @@ CTGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCCGCTTTCGCCTGTACTGGGTC TCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTGGGGAACCCACTGCT TAAGCCTCAATAAAGCTTGCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGA CTCTGGTAGTTACCAGAGTCACACAAC ->MK115527.1 -ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC -GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA -CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT -AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG -CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA -GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA -ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC -ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT -GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT -AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA -GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC -TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT -TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC -ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA -CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG -AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC -AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA -AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC -CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA -ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT -CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG -GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG -ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG -GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA -ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA -TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT -TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG -TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA -TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG -TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG -CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA -ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT -GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT -TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG -AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC -AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG -GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC -AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT -GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT -CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG -AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC -TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC -AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT -TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA -CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT -TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC -AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA -TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA -TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT -CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT -GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA -ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT -CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC -AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC -AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA -AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG -GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC -AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA -AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA -ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC -TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA -AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA -CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA -TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT -CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA -GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA -AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA -AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA -AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA -GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA -TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG -AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA -TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA -AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG -ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA -GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG -TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA -TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG -AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA -CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA -CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG -GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT -CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA -GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG -GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA -TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA -GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC -AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG -AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG -CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA -AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC -ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA -GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA -ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT -GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT -GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC -CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT -GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC -AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA -TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA -AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA -GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG -ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT -GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA -GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA -GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG -ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC -CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT -GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA -AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT -AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT -CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT -CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA -CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA -GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA -GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA -AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA -AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT -GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG -GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA -ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT -GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA -AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG -TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA -GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG -CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA -GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA -GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA -AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC -ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC -CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT -AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA -AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG -CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG -TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG -ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT -TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA -ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC -TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA -GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC -CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT -AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA -GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA -AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC -TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG -AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG -CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT -GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA -GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT -CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG -ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA -TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA -AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA -GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG -CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA -TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG -AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC -T >MK114997.1 TGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCGGGCGCCACT GCTAAGATTAGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACT @@ -3399,166 +2598,6 @@ CTGCATCCGGAATATTTCAAGGACTGCTGACACTGAGATTTCTACAAGGGACTTTCCGCT GGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCTCAGATG CTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAG CCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT ->MK115518.1 -TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG -CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT -AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG -CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG -CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC -CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT -AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC -CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT -CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC -GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA -TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT -AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC -AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA -ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT -ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA -GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT -AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC -ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC -ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA -TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG -ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG -TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC -ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT -AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG -AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA -AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT -AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG -GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA -TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG -TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA -ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG -GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC -AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA -GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG -CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA -GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA -GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT -GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA -AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA -CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA -GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA -AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT -ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG -GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA -CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT -GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG -CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA -GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT -GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT -CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT -TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA -AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT -CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA -CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA -ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA -GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT -CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA -ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA -TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC -ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA -TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA -GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC -CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT -TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA -CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG -GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA -GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC -CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA -CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG -GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA -GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT -ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG -CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC -GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA -GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG -GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA -GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA -CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG -GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA -GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT -AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT -TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG -GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC -ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA -ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT -TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC -TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG -ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG -AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA -GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA -CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT -ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA -CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA -CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG -AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA -AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG -ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT -ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT -AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG -GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA -AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT -TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT -GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG -CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG -GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC -ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC -TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG -AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA -ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG -ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA -AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA -AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT -GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG -AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC -ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA -TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC -AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA -AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC -CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC -AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA -ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG -CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC -TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG -ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT -TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG -GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT -CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA -ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA -AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG -GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT -GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG -AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG -AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA -ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG -GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC -CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG -AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG -CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT -TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA -AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT -TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC -AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG -CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA -AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC -CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC -TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT -TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG -GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC -AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT -CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA -GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA -GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG -CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG -GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT -GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC -TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115065.1 TAGCCTCCGCTAGTCAAAAATTTCGGCGTACTCACCAGTCGCCGCGCCTCGCCTCTTGCC GTGCGCGCTCAGCAAGCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTT @@ -3877,167 +2916,6 @@ AAGAGGCGTGGCCTAGGCAGGACCGAAGAGTGGCGAGCCCTCAGATGCTGCATAAAAGCA GCTGCTTTTGCCTGTACTAGGTCTCTCTAGTTAGACCAGATCTGAGCCTAGGAGCTCTCT GTCTAACTAAGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTA GTG ->MK115530.1 -TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC -GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG -ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC -AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG -CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT -GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG -CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG -CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC -TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT -GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA -AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA -AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG -AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT -CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA -TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA -AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT -ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT -TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT -TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG -GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT -GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA -GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA -ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA -AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC -CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG -AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA -CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG -GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT -CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT -TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT -GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT -TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC -CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT -CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT -TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA -TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA -AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA -AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT -TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA -AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT -GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA -AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA -AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA -CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT -AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA -GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA -CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA -AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA -TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG -ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC -ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT -GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG -GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC -CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA -CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT -AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT -TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA -ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC -TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG -GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG -GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC -TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT -TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT -GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT -TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT -AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA -ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA -TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT -TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA -AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC -ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC -AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG -GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT -TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA -AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG -AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA -AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC -AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA -TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA -AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA -AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA -TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA -AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC -ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG -AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA -CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT -CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC -AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC -CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG -AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT -AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG -ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC -CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT -TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC -ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC -ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA -GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT -AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG -CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC -AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG -AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG -GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA -CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC -ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA -GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA -CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA -ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT -AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA -ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA -GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC -TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG -ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA -GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT -TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA -ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG -AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT -ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA -GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA -GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT -ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA -GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA -GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA -GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA -GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT -GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA -GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC -GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG -CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG -GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG -CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT -GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG -GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC -CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT -TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA -TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA -TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA -GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA -TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG -AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA -ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT -ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA -GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG -GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC -TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC -TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA -TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA -GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA -AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG -GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC -CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC -CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC -GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG -AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT -TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC -AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT -CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT -GCCT >MK115520.1 ATCTCTAGCAGAAGCGCCCGACCAGACTCTGGCGACCGGACACCGTTCATCCCTTGGAGA CCCGCCAGACTCAAGCTATTGCAGTGGCGCCCGACTCTGGAACTAGAGATCCCTCACCCT @@ -4199,168 +3077,6 @@ AGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTC TGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAG CCTCAATAAAGCTTTGCCTTCTAGATGTGTACAATCTAGTTGCCATATTCCTGGACTACA ATCTACTTGTCCATGCATGGCCTCTCCTTTTGCTGACATTTATCACAGC ->MK115503.1 -GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG -AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG -CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA -ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT -AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG -ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC -AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG -CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT -AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT -AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA -CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA -AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT -AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA -ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC -TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT -TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT -ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA -AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG -CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC -ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT -CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT -AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA -AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT -GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC -ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT -GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG -ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA -AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC -AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC -AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG -CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT -TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG -GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG -ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT -TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC -AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT -CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA -GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA -TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG -ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT -GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT -AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA -CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA -AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT -ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG -AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG -AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA -GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT -AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT -AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA -TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA -GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG -AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG -CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA -AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC -CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA -CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA -AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT -CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT -AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA -TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG -GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA -GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA -GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA -AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT -TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA -TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA -GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT -GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA -GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG -GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA -TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA -CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA -TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG -AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC -AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC -TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA -GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC -CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT -ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT -TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC -TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG -AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA -AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC -AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG -TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT -GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG -GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT -TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG -GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC -ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA -TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA -TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC -CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC -ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC -AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA -GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA -GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG -GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT -ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT -AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA -AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA -CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA -CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT -ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA -AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC -CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA -ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT -GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA -CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA -TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG -TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA -TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG -CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA -ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT -TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG -CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA -ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA -TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT -TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC -ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT -TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG -CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT -GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT -CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT -TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG -TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA -GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA -GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA -TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC -TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC -AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG -TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT -GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA -AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA -GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA -TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG -TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG -ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT -TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT -GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA -GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA -AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA -GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA -GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG -GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG -GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT -ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA -GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC -TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC -CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA -GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG -CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG -ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT -CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC -AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT -GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG -TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT -CAATAAAGCTTGCCTTG >MK115570.1 AACGTGTCGTGCCCCCAAAACATAACGTAAACGTGGAAGCGGAGAGCCTTAAGGTAACTG CGGGGCCCCAAATCCAATATCTAGGGCGCCCGAACGAGACTCTGGTAACTAGAGATCCCT @@ -4521,163 +3237,6 @@ TCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCT CAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGA TCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCT TGCCT ->MK115509.1 -CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT -AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC -TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT -CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC -TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA -TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC -AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG -GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA -TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA -TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG -GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT -AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA -GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA -CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG -CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG -GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA -TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA -GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG -CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC -ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT -ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG -ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC -TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT -TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA -GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA -CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA -ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC -AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT -GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA -ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA -GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG -GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC -CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG -ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG -GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC -ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC -TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG -TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA -AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA -TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA -AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG -TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG -ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT -TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC -CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC -CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG -GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT -TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA -TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG -ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA -TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA -CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT -TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC -AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA -AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG -AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA -GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT -GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG -AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA -CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA -CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG -GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC -CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA -AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA -AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG -AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC -CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA -TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG -GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC -CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG -TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT -GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG -TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG -AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG -GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA -CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA -GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG -TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG -ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA -ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT -TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA -GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG -CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC -CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT -ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT -AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA -AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG -ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA -AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT -ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC -TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA -GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT -CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT -TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA -AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT -GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA -ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA -GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG -GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT -GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA -AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA -TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT -GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA -GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG -TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG -AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA -GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA -TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT -ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG -TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC -ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA -AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT -GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC -TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC -ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT -AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA -AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT -GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT -CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT -GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT -AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT -GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG -AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT -AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT -GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT -GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA -GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT -TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG -TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT -TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA -AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT -AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT -AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT -ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA -AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT -TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT -CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA -TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT -CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG -AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT -GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG -AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG -AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC -TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA -GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC -TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC -TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG -AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG -TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC -CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC -TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT -ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG -AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115702.1 GAATACTGCCATTTGTACTGCTGTCTTAAGATGTTCAGCCTGATCTCTGACCTGTCCTAT TATTTTCTTTAATTCTTTATTCATAGATTCTACCACTCCTTGACTCTGGGGATTGTAGGG @@ -4985,319 +3544,6 @@ GGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTAGGTCT CTCTGGTTAGACCAGATCTGAGCCTAGGAGCTCTCTGGCTAACTAGAGAACCCACTGCTT AAGCCTCAATAAAGCTTGCCTTGAGTGCTATAAGTAGTGTGTGCCCGTCTGTTGTGTGAC TCTGGTAACTAGAGATC ->MK115490.1 -CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG -GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC -AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA -ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG -GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA -ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA -GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA -AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA -AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA -AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT -AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA -TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC -AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA -GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC -CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA -GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA -GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT -ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA -GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA -GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA -GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT -AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA -GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG -ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA -GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC -CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG -CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA -GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG -GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG -CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA -CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA -AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG -TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA -CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG -GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG -CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA -CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT -TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA -AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC -CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA -GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT -TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG -GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA -TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG -GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA -GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG -ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT -GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT -ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT -GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG -CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG -TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG -AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC -AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG -GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG -TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC -CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC -CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG -AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT -TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA -CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG -AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA -AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT -ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG -TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC -ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG -TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG -GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG -TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG -AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA -CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT -GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG -AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC -TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG -GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG -AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG -ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC -AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG -GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG -AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA -CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT -GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG -GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC -CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA -AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG -GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA -CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG -GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG -AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA -CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT -TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG -CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT -AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC -ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT -CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG -CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT -GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG -TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG -GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG -TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC -AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT -TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA -TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT -AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC -TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT -GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA -GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG -TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT -TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA -TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG -AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT -AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA -ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG -ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG -TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA -ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT -AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA -TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT -CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC -CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG -AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA -CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC -ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC -TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT -GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG -AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA -GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG -TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA -ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA -TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA -ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA -ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT -AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT -TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG -TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG -GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT -TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG -GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT -CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG -TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA -AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA -TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC -ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG -CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA -TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG -GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG -GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT -TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA -ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA -TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT -ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA -GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC -AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT -CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT ->MK115576.1 -AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT -AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG -CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG -AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC -CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA -GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT -CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG -TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA -GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG -GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT -GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA -CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC -CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA -GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC -ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT -CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC -AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA -AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC -ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA -CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG -GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA -TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT -ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA -AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA -AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG -GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT -GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC -CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC -AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC -TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA -GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT -GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC -TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC -AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT -TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC -AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG -GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA -ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC -CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA -CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC -CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG -AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG -GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC -CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA -CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA -TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG -TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA -GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA -AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT -GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA -AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT -TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG -CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT -ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT -ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG -GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA -GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG -AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA -CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA -CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA -CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT -TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT -CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA -ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC -ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG -TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT -GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA -GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG -GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG -TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT -ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA -GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT -TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA -AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG -CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA -GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA -AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG -CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG -TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG -ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT -ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT -CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA -TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA -TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT -CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA -GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG -GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA -CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA -ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA -GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG -GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT -GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT -CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC -TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC -TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT -CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA -ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA -GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA -AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG -GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG -GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC -ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT -ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT -GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG -CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA -TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG -CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA -TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA -CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA -TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG -ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC -TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT -CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC -AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC -AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG -GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT -AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG -AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG -GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT -TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT -TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA -GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA -TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG -AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG -AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT -ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA -TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA -AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG -CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA -TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC -CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA -TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT -ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT -AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC -GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG -ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG -CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT -TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT -TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA -GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC -TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA -AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG -CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA -ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG -TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG -ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA -GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA -ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG -TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA -GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC -TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT -GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG -GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG -GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC -TGCTTAAGCCTCAATAAAGCTTGCCT >OQ092466 GACGGCCGAGGTGGCTCTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGA TCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCC diff --git a/tests/expected-results-large-csv/orfs.csv b/tests/expected-results-large-csv/orfs.csv index e85fe8e..e886aad 100644 --- a/tests/expected-results-large-csv/orfs.csv +++ b/tests/expected-results-large-csv/orfs.csv @@ -1,158 +1,158 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides -KX505501.1,env,0,1824,6224,8795,forward,0.7626080297560442,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,env,0,1824,6223,8794,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG KX505501.1,vif,0,1824,5040,5619,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,nef,0,1824,8796,9417,forward,0.7645782478980201,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,tat_exon1,1,1750,5830,6046,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,nef,0,1824,8795,9416,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,tat_exon1,1,1750,5829,6045,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT KX505501.1,gag,336,1824,789,2292,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon1,1306,1750,5969,6047,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,vpr,1599,1824,5558,5843,forward,0.7638478800047243,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon1,1306,1750,5968,6046,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,vpr,1599,1824,5558,5849,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1599,1824,6060,6309,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG KX505501.1,pol,1627,1927,2084,5096,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,tat_exon2,1746,1824,8376,8469,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon2,1747,1927,8377,8653,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,vpu,1748,1778,6259,6310,forward,0.7688723205964585,MHPEYYKDC,MHPEYYKDC*,ATGCATCCGGAGTACTACAAGGACTGCTGA +KX505501.1,tat_exon2,1746,1824,8375,8471,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon2,1747,1927,8376,8652,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA MN691959,gag,639,2142,789,2292,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN691959,pol,1934,4946,2084,5096,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN691959,vif,4890,5469,5040,5619,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG -MN691959,vpr,5408,5699,5558,5843,forward,0.5391891891891883,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN691959,tat_exon1,5679,5898,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN691959,rev_exon1,5818,5899,5969,6047,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN691959,env,6070,8656,6224,8795,forward,0.13638128518734216,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA -MN691959,vpu,6105,6156,6259,6310,forward,0.2321981424148607,MGVEMGHHAPWDIDDL,MGVEMGHHAPWDIDDL*,ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG -MN691959,tat_exon2,8237,8333,8376,8469,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA -MN691959,rev_exon2,8238,8514,8377,8653,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG -MN691959,nef,8657,9278,8796,9417,forward,0.08588605782994552,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA -MN692074,nef,0,4059,8796,9417,forward,0.763072203234748,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG -MN692074,env,2,4115,6224,8795,forward,0.7604257801108195,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpu,2,2084,6259,6310,forward,0.7659115426105717,MGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAA +MN691959,vpr,5408,5699,5558,5849,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN691959,tat_exon1,5679,5898,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN691959,rev_exon1,5818,5899,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN691959,vpu,5910,6156,6060,6309,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8656,6223,8794,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA +MN691959,tat_exon2,8237,8333,8375,8471,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8514,8376,8652,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9278,8795,9416,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,nef,0,4059,8795,9416,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG +MN692074,env,2,4115,6223,8794,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA MN692074,gag,789,2292,789,2292,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN692074,pol,2084,4115,2084,5096,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA MN692074,vif,3617,4115,5040,5619,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpr,3617,4115,5558,5843,forward,0.7635778016363703,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,tat_exon1,3823,4084,5830,6046,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,rev_exon1,3823,4084,5969,6047,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,tat_exon2,4080,4164,8376,8469,forward,0.7699443413729128,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA -MN692074,rev_exon2,4081,4153,8377,8653,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG +MN692074,vpr,3617,4115,5558,5849,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpu,3617,4115,6060,6309,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4084,5829,6045,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4084,5968,6046,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,tat_exon2,4080,4164,8375,8471,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4081,4153,8376,8652,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5843,forward,0.587876570313453,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5830,6046,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5969,6047,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,env,6212,8783,6224,8795,forward,0.47520309038232134,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,vpu,6253,6298,6259,6310,forward,0.3649167733674775,MEMGHHAPWDVDDL,MEMGHHAPWDVDDL*,ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,tat_exon2,8364,8460,8376,8469,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8377,8653,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8796,9417,forward,0.4049958673891082,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA MN090335,gag,315,1665,789,2292,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA MN090335,pol,1427,4469,2084,5096,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN090335,vif,4413,4992,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090335,vpr,4931,5222,5558,5843,forward,0.6083541998634192,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG -MN090335,tat_exon1,5202,5421,5830,6046,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA -MN090335,rev_exon1,5341,5422,5969,6047,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG -MN090335,env,5596,8158,6224,8795,forward,0.5139610675592354,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA -MN090335,vpu,5643,5682,6259,6310,forward,0.5690703735881842,MGHDAPWDVDDL,MGHDAPWDVDDL*,ATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG -MN090335,tat_exon2,7739,7835,8376,8469,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA -MN090335,rev_exon2,7740,8016,8377,8653,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG -MN090335,nef,8159,8813,8796,9417,forward,0.49485619884358334,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MN090335,vpr,4931,5222,5558,5849,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG +MN090335,tat_exon1,5202,5421,5829,6045,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA +MN090335,rev_exon1,5341,5422,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG +MN090335,vpu,5433,5682,6060,6309,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8158,6223,8794,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7835,8375,8471,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8016,8376,8652,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8813,8795,9416,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA MN090376,gag,522,1590,789,2292,forward,0.6828741441147701,MYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MHTIEDCYCIK**FKFL*SCLKCWL*LSQYLSTAF*CF*QARINCESFQFPACPYYMF*LISFLSPWP*PNFLPFV*FSPA*YRRSRTHLSPSSLR*SKRRTHRSPPLASCCARFSKPSPIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGCACACAATAGAGGACTGCTACTGTATTAAATAATGATTTAAGTTCCTCTGATCCTGTCTGAAGTGCTGGTTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCCAGTTCCCTGCTTGCCCATACTATATGTTTTAACTTATATCTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATTTGTCTAATTCTCCCCCGCTTAATACCGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAAGGCGTACTCACCGTTCGCCGCCCCTCGCCTCTTGCTGTGCGCGCTTCAGCAAGCCGAGTCCGATAATTCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA MN090376,pol,1382,4394,2084,5096,forward,0.23966680468616797,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTGACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAGACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGATGAGCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCTGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTCGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAG MN090376,vif,4338,4920,5040,5619,forward,0.42479043044174425,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAGCATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGACTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAAAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090376,vpr,4859,5150,5558,5843,forward,0.580763397371082,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN090376,tat_exon1,5130,5349,5830,6046,forward,0.46628407460545196,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAA -MN090376,rev_exon1,5269,5350,5969,6047,forward,0.5763097949886105,MAGRSGDSDEELLRIAGTIKFLYQSSK,MAGRSGDSDEELLRIAGTIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAAG -MN090376,env,5524,8110,6224,8795,forward,0.4972760674014952,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -MN090376,vpu,5568,5631,6259,6310,forward,0.6063492063492064,MGNHAHLDMGHHAPWDVNDL,MGNHAHLDMGHHAPWDVNDL*,ATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA -MN090376,tat_exon2,7691,7784,8376,8469,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG -MN090376,rev_exon2,7692,7968,8377,8653,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG -MN090376,nef,8111,8735,8796,9417,forward,0.5093153589821267,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MN090376,vpr,4859,5150,5558,5849,forward,0.36116422349691957,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN090376,tat_exon1,5130,5349,5829,6045,forward,0.46628407460545196,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAA +MN090376,rev_exon1,5269,5350,5968,6046,forward,0.5763097949886105,MAGRSGDSDEELLRIAGTIKFLYQSSK,MAGRSGDSDEELLRIAGTIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAAG +MN090376,vpu,5361,5631,6060,6309,forward,0.5680096940321115,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA +MN090376,env,5524,8110,6223,8794,forward,0.49863720871464445,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MN090376,tat_exon2,7691,7784,8375,8471,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MN090376,rev_exon2,7692,7968,8376,8652,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MN090376,nef,8111,8735,8795,9416,forward,0.5036770338593534,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA MK115581.1,gag,680,2180,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115581.1,pol,1972,4984,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115581.1,vif,4928,5507,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115581.1,vpr,5446,5737,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115581.1,tat_exon1,5717,5936,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115581.1,rev_exon1,5856,5937,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115581.1,env,6111,8652,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115581.1,vpu,6149,6194,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115581.1,tat_exon2,8233,8329,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115581.1,rev_exon2,8234,8510,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115581.1,nef,8653,9268,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115581.1,vpr,5446,5737,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115581.1,tat_exon1,5717,5936,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115581.1,rev_exon1,5856,5937,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115581.1,vpu,5948,6194,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115581.1,env,6111,8652,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115581.1,tat_exon2,8233,8329,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115581.1,rev_exon2,8234,8510,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115581.1,nef,8653,9268,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115690.1,gag,777,2286,789,2292,forward,0.24076694150363465,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAGTGGGAAAAAATTCGGTTGAGGCCAGGGGGAAAGAAAAAATATAGATTAAAGCATATCGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATAATGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTGTATAATACAGTAGCAACCCTCTATTGTGTACATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGGCGCAGGAAACAGCAGTCAGACCAGCACCAGCCAAAATTACCCTATAGTACAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTCTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACTAATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCCACCAGCATTCTAGACATAAGACAAGGACCAAAGGAGCCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTAGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAGGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGTCATAAAGCAAGAGTTTTAGCGGAAGCAATGAGCCAAGCAACAAATTCAGCTGCCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAAAGTGTTAAGTGTTTTAATTGCGGCAAAGATGGGCACATAGCAAAAAATTGCAGGGCCCCTAGAAGAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTCCAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA MK115690.1,pol,2078,5090,2084,5096,forward,0.185747174550021,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGCACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATAGGGCCTGAGAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGACTTCAGAGAACTAAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGACAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAACCTTATAGAAAACAAAATCCAAACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACCTAGAAATAGGGCAGCATAGAATAAAAATAGAAGAACTGAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGACAAGTGGACAGTACAGCCTATAGCGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATCTACCCAGGAATTAAAGTAAGGCAATTATGTAAACTACTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAAAAGAAGCAGAGCTAGAATTAGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGAGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTGACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTGATATGGGGAAAGACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAATCAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTATCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACATGCAATTTATCTAGCTTTGCAAGATTCGGGATTAGAAGTAAATATAGTAACAGACTCACAGTATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTGTTTTTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAGCAGCATACTTTATTTTAAAATTAGCAGGACGATGGCCAGTAGCAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACAGTTAAGGCCGCCTGCTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAACAATGAATTGAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACGTAATAGCAACAGACTTACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAACATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115690.1,vif,5034,5613,5040,5619,forward,0.39766435115272314,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAAGATGGCACAGTTTAGTAAAACACCATATATATATTTCAGGGAAAGCTAGAGGATGGGTTTATAAACATCACTATGAAAACACTCATCCAAGAATAAGTTCAAAAGTATACATCCCACTAGGGGAAGCTAGACTGGCAGTAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGGAATATAGCACACAAGTAGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGTCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTTTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTATTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAG -MK115690.1,vpr,5552,5843,5558,5843,forward,0.5980919765166341,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*,ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAA -MK115690.1,tat_exon1,5823,6042,5830,6046,forward,0.40192926045016075,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ*,ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAA -MK115690.1,rev_exon1,5962,6043,5969,6047,forward,0.524971623155505,MAGRSGDNDEDLLKTVRFIKLLYQSSK,MAGRSGDNDEDLLKTVRFIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAAG -MK115690.1,env,6217,8800,6224,8795,forward,0.4988789237668163,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*,ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA -MK115690.1,vpu,6255,6300,6259,6310,forward,0.3649167733674775,MEMGHHAPWDVDDL,MEMGHHAPWDVDDL*,ATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG -MK115690.1,tat_exon2,8381,8474,8376,8469,forward,0.5303030303030303,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*,AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAG -MK115690.1,rev_exon2,8382,8658,8377,8653,forward,0.42982806877249113,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*,GACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAG -MK115690.1,nef,8801,9425,8796,9417,forward,0.46635769262600346,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*,ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA +MK115690.1,vpr,5552,5843,5558,5849,forward,0.37688442211055273,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*,ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAA +MK115690.1,tat_exon1,5823,6042,5829,6045,forward,0.40192926045016075,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ*,ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAA +MK115690.1,rev_exon1,5962,6043,5968,6046,forward,0.524971623155505,MAGRSGDNDEDLLKTVRFIKLLYQSSK,MAGRSGDNDEDLLKTVRFIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAAG +MK115690.1,vpu,6054,6300,6060,6309,forward,0.48542752364408415,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*,ATGCAATCTTTAGCAATATTAGCAATAGTAGCATTAGTAGTAGCAGCCATAATAGCAATAGTTGTGTGGACCATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGATAGTGGCAATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG +MK115690.1,env,6217,8800,6223,8794,forward,0.49751604598034604,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*,ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA +MK115690.1,tat_exon2,8381,8474,8375,8471,forward,0.4918032786885247,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*,AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAG +MK115690.1,rev_exon2,8382,8658,8376,8652,forward,0.42982806877249113,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*,GACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAG +MK115690.1,nef,8801,9425,8795,9416,forward,0.459649710885779,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*,ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA MK115571.1,gag,579,2079,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115571.1,pol,1871,4883,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115571.1,vif,4827,5406,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115571.1,vpr,5345,5636,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115571.1,tat_exon1,5616,5835,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115571.1,rev_exon1,5755,5836,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115571.1,env,6010,8551,6224,8795,forward,0.4569687738004571,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115571.1,vpu,6048,6093,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115571.1,tat_exon2,8132,8228,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115571.1,rev_exon2,8133,8409,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115571.1,nef,8552,9167,8796,9417,forward,0.4756067663643049,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115571.1,vpr,5345,5636,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115571.1,tat_exon1,5616,5835,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115571.1,rev_exon1,5755,5836,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115571.1,vpu,5847,6093,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115571.1,env,6010,8551,6223,8794,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115571.1,tat_exon2,8132,8228,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115571.1,rev_exon2,8133,8409,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115571.1,nef,8552,9167,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115514.1,gag,584,2084,789,2292,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115514.1,pol,1876,4888,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115514.1,vif,4832,5411,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115514.1,vpr,5350,5641,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115514.1,tat_exon1,5621,5840,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115514.1,rev_exon1,5760,5841,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115514.1,env,6015,8556,6224,8795,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115514.1,vpu,6053,6098,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115514.1,tat_exon2,8137,8233,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115514.1,rev_exon2,8138,8414,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115514.1,nef,8557,9172,8796,9417,forward,0.4756067663643049,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115514.1,vpr,5350,5641,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115514.1,tat_exon1,5621,5840,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115514.1,rev_exon1,5760,5841,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115514.1,vpu,5852,6098,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115514.1,env,6015,8556,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115514.1,tat_exon2,8137,8233,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115514.1,rev_exon2,8138,8414,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115514.1,nef,8557,9172,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115488.1,gag,707,2207,789,2292,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115488.1,pol,1999,5011,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115488.1,vif,4955,5534,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115488.1,vpr,5473,5764,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115488.1,tat_exon1,5744,5963,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115488.1,rev_exon1,5883,5964,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115488.1,env,6138,8679,6224,8795,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115488.1,vpu,6176,6221,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115488.1,tat_exon2,8260,8356,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115488.1,rev_exon2,8261,8537,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115488.1,nef,8680,9295,8796,9417,forward,0.4756067663643049,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115488.1,vpr,5473,5764,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115488.1,tat_exon1,5744,5963,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115488.1,rev_exon1,5883,5964,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115488.1,vpu,5975,6221,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115488.1,env,6138,8679,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115488.1,tat_exon2,8260,8356,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115488.1,rev_exon2,8261,8537,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115488.1,nef,8680,9295,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115030.1,gag,176,1685,789,2292,forward,0.27304152847199525,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA MK115030.1,pol,1477,4489,2084,5096,forward,0.26443159013103534,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115030.1,vif,4433,5012,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK115030.1,vpr,4951,5242,5558,5843,forward,0.594871162618666,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115030.1,tat_exon1,5222,5441,5830,6046,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115030.1,rev_exon1,5361,5442,5969,6047,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115030.1,env,5616,8217,6224,8795,forward,0.510440428145289,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115030.1,vpu,5660,5699,6259,6310,forward,0.6901936289818864,MGHLVPWDGDDM,MGHLVPWDGDDM*,ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK115030.1,tat_exon2,7798,7891,8376,8469,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK115030.1,rev_exon2,7799,8075,8377,8653,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK115030.1,nef,8218,8860,8796,9417,forward,0.5478186258332784,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115030.1,vpr,4951,5242,5558,5849,forward,0.3566796368352788,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115030.1,tat_exon1,5222,5441,5829,6045,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115030.1,rev_exon1,5361,5442,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK115030.1,vpu,5453,5699,6060,6309,forward,0.5682727709300466,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*,ATGCATATCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115030.1,env,5616,8217,6223,8794,forward,0.5091484869809996,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115030.1,tat_exon2,7798,7891,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115030.1,rev_exon2,7799,8075,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115030.1,nef,8218,8860,8795,9416,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA MK115498.1,gag,663,2163,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115498.1,pol,1955,4967,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115498.1,vif,4911,5490,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115498.1,vpr,5429,5720,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115498.1,tat_exon1,5700,5919,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115498.1,rev_exon1,5839,5920,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115498.1,env,6094,8635,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115498.1,vpu,6132,6177,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115498.1,tat_exon2,8216,8312,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115498.1,rev_exon2,8217,8493,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115498.1,nef,8636,9251,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115498.1,vpr,5429,5720,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115498.1,tat_exon1,5700,5919,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115498.1,rev_exon1,5839,5920,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115498.1,vpu,5931,6177,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115498.1,env,6094,8635,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115498.1,tat_exon2,8216,8312,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115498.1,rev_exon2,8217,8493,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115498.1,nef,8636,9251,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115211.1,gag,250,1753,789,2292,forward,0.25132972351334526,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAGATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAAGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACACAGGACATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCATTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAGCCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAAACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAAATGCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA MK115211.1,pol,1545,4557,2084,5096,forward,0.2540106951871657,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAGAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCTGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATTTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTACCACCTGTAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGGCAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGTAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA MK115211.1,vif,4501,5083,5040,5619,forward,0.40472673559822736,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MK115211.1,vpr,5022,5313,5558,5843,forward,0.5885636318531382,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAG -MK115211.1,tat_exon1,5293,5512,5830,6046,forward,0.4691531785127845,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAAGACTGCTTGCACCAGTTGCTATTGTAAAAGGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA -MK115211.1,rev_exon1,5432,5513,5969,6047,forward,0.564475664826894,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG -MK115211.1,env,5687,8198,6224,8795,forward,0.6631820277358986,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -MK115211.1,vpu,5731,5794,6259,6310,forward,0.6405797101449275,MGNHAHLGMGHHAPWEVNDL,MGNHAHLGMGHHAPWEVNDL*,ATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA -MK115211.1,tat_exon2,7779,7872,8376,8469,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG -MK115211.1,rev_exon2,7780,8056,8377,8653,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG -MK115211.1,nef,8199,8823,8796,9417,forward,0.5148270181219111,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MK115211.1,vpr,5022,5313,5558,5849,forward,0.3808935556928146,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAG +MK115211.1,tat_exon1,5293,5512,5829,6045,forward,0.4691531785127845,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAAGACTGCTTGCACCAGTTGCTATTGTAAAAGGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA +MK115211.1,rev_exon1,5432,5513,5968,6046,forward,0.564475664826894,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG +MK115211.1,vpu,5524,5794,6060,6309,forward,0.5776066350710902,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTATTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA +MK115211.1,env,5687,8198,6223,8794,forward,0.6638103647692366,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MK115211.1,tat_exon2,7779,7872,8375,8471,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MK115211.1,rev_exon2,7780,8056,8376,8652,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MK115211.1,nef,8199,8823,8795,9416,forward,0.5093153589821267,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA MK115158.1,gag,316,1819,234,1731,forward,0.38499312512276596,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAACAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACCCAGGAAATAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCTTTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACGATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAACCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA MK115158.1,pol,1611,4623,1526,4535,forward,0.30843043180260443,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTCTACCAGGAAGATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATGGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTGCATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCTCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACTTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAGGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAGGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA MK115158.1,vif,4567,5149,4479,5061,forward,0.48399487836107546,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGTTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACGGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG @@ -167,58 +167,58 @@ MK115158.1,nef,8316,8940,8213,8834,forward,0.5254870367657829,MGGIFSKRNGGGWPAIRE MK114705.1,gag,532,2047,789,2292,forward,0.27270615563298484,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGCGAATTAGATAGATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCGGTTAATCCTGGCCTGTTAGAAACATCAGAGGGCTGTAGGCAAATACTGGGACAGCTACAACCGTCCCTTCAAACAGGATCAGAAGAACTTAAATCATTATTTAATACAATAGCAGTCCTTTATTGCGTACATCAAAGGATAGATGTAAAAGACACCAAGGAAGCTCTAAATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGTCAGAGCAGTCAAGTCAGCCAAAATTACCCTATAGTGCAGAACCATCAGGGGCAAATGGTATATCAGGCTCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCCGAGGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAGGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGGACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCATGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTATCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCTTTTAGAGATTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAAGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTCTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCAGCCACAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGCAACAGGTGGTGCAACTAACATAATGATGCAGAAAGGCAATTTTAGGAACCAAGGAAAACCTATTAAGTGTTTCAATTGTGGCAAAGAAGGGCACCTAGCTAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCTCTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAA MK114705.1,pol,1839,4851,2084,5096,forward,0.21944123990570308,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTAAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAACCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCCGTATTTGCCATAAAGAAAAAGGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAGCTTAATAAAAGAACTCAAGACTTTTGGGAGGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTCTCAGTTCCTTTAGATGAAAGCTTCAGAAAGTATACTGCATTTACCATACCTAGTACTAACAATGAGACACCCGGGATTAGGTATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTTCAAAGTAGCATGACGAAAATCTTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTACCAATACATGGATGATTTATACGTAGGATCTGACTTAGAAATAGAGCAGCATAGAGCAAAAGTAGAGAACCTGAGAGAGCATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAGCATCAGAAAGAACCTCCATTTCTTTGGATGGGCTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAGCTAAGGCACTAACAGAAGTGATAACACTAACAGAAGAAGCAGAGCTAGAATTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAGTAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACCTATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAAGCAGTTCAAAAAATAGCCACAGAGAGCATAGTAGTATGGGGAAAGATTCCTAAATTTAGATTACCCATACAGAAAGAAACATGGGAAACATGGTGGATGGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAGTACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGGCAAAAAGTTATCCCCTTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGACAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAGAAGGTCTACCTGACATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCAGGAATCAGGAAAATACTATTTTTGGATGGAATAGATAAGGCCCAGGAAGATCATGAGAAATATCATAGTAATTGGAAAGCAATGGCTAGTGATTTTAACATACCACCTGTGGTAGCAAAAGAGATAATAGCCAGCTGTGATAAATGTCAGCTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTCCATGTAGCCAGTGGGTACATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAATAATACATACAGATAATGGTAGCAATTTCACCAGCACTACAGTCAAGGCCGCCTGCTGGTGGGCAGGTGTTAAGCAGGAGTTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTGGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGAGTACTGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTGCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATCAAAGTAGTACCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK114705.1,vif,4795,5374,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTCTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGGTTTACAGACACCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAACACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATATGTACTATTTTGATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTGCAATACCTGGCACTAGCAGTATTAGTAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTCGCGAGACTGACAGAGGATAGATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAG -MK114705.1,vpr,5313,5598,5558,5843,forward,0.5871212121212123,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*,ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAG -MK114705.1,tat_exon1,5578,5797,5830,6046,forward,0.5138258357408172,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*,ATGGAGCCCGTAGATCCTAGACTGGAACCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTAACAATTGCTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGCTTCACAAAAAAGGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAA -MK114705.1,rev_exon1,5717,5798,5969,6047,forward,0.5940834141610087,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK,ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG -MK114705.1,env,5972,8549,6224,8795,forward,0.49969138043715056,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*,ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MK114705.1,vpu,6010,6055,6259,6310,forward,0.5970755483346872,MEMGRLAPWNVDDL,MEMGRLAPWNVDDL*,ATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG -MK114705.1,tat_exon2,8130,8226,8376,8469,forward,0.6074396517609815,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD**,AGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGA -MK114705.1,rev_exon2,8131,8407,8377,8653,forward,0.47688921496698455,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*,GACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAG -MK114705.1,nef,8550,8985,8796,9417,forward,0.6054615099468668,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*,ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAG +MK114705.1,vpr,5313,5598,5558,5849,forward,0.39401343921808174,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*,ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAG +MK114705.1,tat_exon1,5578,5797,5829,6045,forward,0.5138258357408172,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*,ATGGAGCCCGTAGATCCTAGACTGGAACCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTAACAATTGCTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGCTTCACAAAAAAGGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAA +MK114705.1,rev_exon1,5717,5798,5968,6046,forward,0.5940834141610087,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK,ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG +MK114705.1,vpu,5809,6055,6060,6309,forward,0.5727186311787074,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*,ATGCAACCTTTAGAGATATCAGCAATAGTAGCATTAGTAGTAGTAGCAATAATAGCAATAGTTGTGTGGACCATAGTACTCTTAGAGTATAGGAAAATATTAAGGCAAAAGAAAATAGACAGATTAATTAATAGAATAAGTGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG +MK114705.1,env,5972,8549,6223,8794,forward,0.5021538905210794,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*,ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MK114705.1,tat_exon2,8130,8226,8375,8471,forward,0.6074396517609815,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD**,AGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGA +MK114705.1,rev_exon2,8131,8407,8376,8652,forward,0.47688921496698455,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*,GACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAG +MK114705.1,nef,8550,8985,8795,9416,forward,0.6017710152157637,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*,ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAG MK114856.1,gag,120,2022,789,2292,forward,0.7511039743075072,MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC,MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ*,ATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTGGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGTTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGGCTCAAATCTGGTCCAACCAGAGAGACCCAGTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAAAGGCGGCGACTGGTGAGTACGCCATTTTTGACTAGCAGAGGCTAGAAGGAGAAAGATAGGTGCGAGAGCGTCAGTATTGAGCAGAGGAGAATTAGATAGATAGGAGAAAATTCAGTTAAGGCCAAGGAGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAAGGAACTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGGAGGCTGTAAACAGATATTAGAACAGCTACAACCATCCCTTCAGACAAGATCAGAAGAACTTAGATCATTATATAATACAGTAGCCACCCTCTATTATGTACATCAAAAGATAGATGTAAAAGACACCAAAGAAGCGTTAGACAAAGTAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCGGCAGCTGACACAAGAAACAGAGGCCAGACCAGTCAAAATTTCCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAGGCCATATCACCTAGAACTTTAAATGCATAAGTAAAAGTAGTAGAAGAAAAAGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACTATGCTAAACACAGTAAGTAGACACCAAGCAGCTATGCAAATGTTAAAAAAGGTCATCAATGAAGAAGCTGCAGAATAAGATAGATTACATCCAGTGCATGCAAGGCCTATTGCACCAGGCCAGATAAGAGAACCAAAAAGAAGTGACATAGCAAGAACTACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAAGAAAGATTTATAAAAGATAAATAATTCTAGGACTAAATAAAATAGTAAAAATGTATAGCCCTACCAGCATTTTAGACATAAAGCAAAGGCCAAAAGAACCCTTTAGAGACTATGTAGACCAGTTCTATAAAACTTTAAGAGCCAAGCAAGCTACACAGAAAGTAAAAAATTAGATGACAAAAACCTTGTTAGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAAAAAGTAAGAAGACCCGGCCATAAAGCAAAAGTTTTAGCTGAAGCAATGAGCCAAGCAACAGGTGCAGCCAACATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAAAGCACATAGCCAAAAATTGCAAGGCCCCTAAGAAAAAAGGCTGTTAGAAATATAGAAAAGAAAGACACCAAATGAAAAATTGCACTAAGAGACAGGCTAATTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA MK114856.1,pol,1787,4826,2084,5096,forward,0.7637180771917039,ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI,FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*,TTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAAGAGAGCAACTAAAGAAAGCTTTATTAAATACAGGAGCAGATGATACAGTATTAGAAGACATAGATTTGCCAAGAAAATAGAAACCAAAAATGATAAGAAGAATTAGAAGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCAGACACAAAGCTATAAGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTAGAAGAAATCTGTTGACTCAGCTTAGTTGCACTCTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAAGAATGGACGGCCCAAAAGTTAAACAATAGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATAGAAAAAGAAAAGAAAATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATAGAAAAAATTAGTAGATTTCAGAGAACTTAATAAGAAAACTCAAGATTTCTAAGAAATTCAATTAAGTATACCACATCCTGCAAAGCTAAAAAAGAAAAAATCAGTCACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAAGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAAAGATTAGATATCAGTATAATGTGCTTCCACAAAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTAGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAAGGCAACATAGAACAAAAGTAAAGGAACTGAGGCAACATCTAATGAGGTAAAGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTAGATGAGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAAGAAAGTTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAATTGAATTAGGCAAGTCAGATTTATGCAAAGATTAAAGTGAAGCAATTATGTAAGCTCCTTAAAAGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAAAGATTCTAAAAGATCCAGTACATAGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAAAGAGAAGGTCAGTGGACATATCAAATTTATCAAAAGCCATTTAAAAATCTAAAAACAGAGAAATATGCAAGAACGAAAGGTGCCCATACTAATGATGTAAAGCAATTAACAGAAGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATAAAGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATAAGAAACATAGTGGACAGATTATTGGCAAGCCACCTAGATCCCTAAGTAAGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATAGTACCAGTTAGAAAAAGAACCCATAATAAGAGCAGAAACCTTCTATGTAGATAAGGCAGCTAATAAAGATAATAAATCAAGAAAAGCAAGATATGTTACTGACAGAAGAAGACAAAAAGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAAGATTCAGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAAAGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGAAAAAAGTCTACCTGGCATAAGTGCCAGCCCACAAAAGAATTAAAAGAAATGAACAGGTAAATAAACTAGTCAGTGCTAGAATCAAGAAAGTACTATTTTTAGATAAAATAGAAAAAGCCCAAGAAGACCATAAAAAATATCACAGTAATTAAAGAACAATGGCTAGTAATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAAAAGAAGCTATGCATAGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAAGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAAGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTAGTAGGCAAAAATCAAGCAAGAATTTAGTATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAAAATCTATAAATAATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAG MK114856.1,vif,4425,5349,5040,5619,forward,0.7566838361540349,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK,MN*RKL*DK*KIRLNILRQQYKWQYSSTILKEKGGLKDTVQRKE**T**QQKYRLKNYKNKLQKFKIFRFITRTAEIHFRKDQQSFSGKVKRQ**YKITVT*K*CQEEKQKSLRIIKNRWQVMIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH*,ATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAGAAATAGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGAGGTGCTAGATTAGTAATAACAACATATTAAGGTCTGCATACAGGAGAAAAAGACTGGCATTTAGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAG -MK114856.1,vpr,5033,5579,5558,5843,forward,0.7661862444925697,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*,ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAG -MK114856.1,tat_exon1,5486,5780,5830,6046,forward,0.7619181418001311,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN,ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT -MK114856.1,vpu,5486,6206,6259,6310,forward,0.7713277742142399,MRYLCKEMQIPLYSVHQMLKHMIQKYIMFRPHMPVYPQTLTHMK,MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVNNTCNATFKDISNSSISSSSNNSNSCVDHSRHKI*ENIKTKKNR*NN**NKKKSRRQWQ*ERKRSGRIVSTCSRNKARCSLRC**SVVLRKICKSQSIMRYLCKEMQIPLYSVHQMLKHMIQKYIMFRPHMPVYPQTLTHMK*,ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAATAATACATGTAATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAG -MK114856.1,rev_exon1,5698,5779,5969,6047,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAA -MK114856.1,env,5953,8521,6224,8795,forward,0.7529994904340572,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*,ATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTAGAAAAATAACATGGTAGACCAGATGCATGAGGATATAATCAATTTATGAGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAAAAATAATACTGTAGGAAATCAAACAAATTATCATCTCAATGAAACTAATACAATACAAAGAAAAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAATATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAAAGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTAGTTTTGCAATTCTAAAGTGTAAAGATGAGATGTTCAATAGAACAAGACCATGTAAGAATGTCAGCACAGTACAATGTACACATAGAATTAGACCAGTAGTGTCAACTCAACTGCTGTTAAATAGTAGCCTAGCAGAAAAAAAGATAGTACTTAGATCTGAAAATTTCACAGACAATACTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAAAGAGAGCAATTTATGCAACAAGACAGATAATAGAAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGAAGTGACACTTTAAGCAAAATAGTTGAAAAATTAAAGGAAAAATTTAGAAAAAATAAAACAATAATCTTTAAGCAATCATCAAGAGAGGACATAGAAATTGAAACGCACAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGAAGTGTTAATAGAACTAGCATAAACAGAACTAACAATAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATCAACAGGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCTATCAGTAAGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATAGTAGTACAACTAATAGTAAAGAAGAGACCTTCAGACCTAGAGAAAGAAATATGAAGGACAATTAGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAAAAGTAGCACCCACCAAGGCACAAAGAAAAGTAGTGCAGAGAGAAAAAAGAGCAATAAGAACGTTAGGAGCTATGTTCCTCAGGTTCTTAAGAACAGCAGGAAGCACTATAGGCGCAGCGTCACTGACGCTGACAGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTAAGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTAGAAAGATACCTACAAGATCAACAGCTCCTGAAGATTTGAAGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATACTAGTTAGAGCAATAAATCTTACAGTACCATCTAAGATAACATGACCTAGATGCAGTAGGACAGAGAAATTCAAAATTACACAAAGATAATATACAACTTACTTAAAGAATCGCAAATCCAACAGAAAAAGAATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAA -MK114856.1,nef,7916,9176,8796,9417,forward,0.7587548638132295,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MKKNY*N*INEQICRISLV*QNGYSI*KYS****EA**V*K*FLLYFL**IELGKDTHHYHCRPSSQPQEDQTGPKE*KKKVKRETEADPED**LDSYHSSKTTCKACAFSATTT*KTYS*LC*RLCKF*DTRSKRSSSTSRVSCSIKFRN*RIVLLACSIP*LSQ*LKEQIKL*K*DKKLAELFSTYLER*DKA*KRLCNKISGK*SKSCMAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAAAATAAGTGGCAAGTAGTCAAAAAGTTGTATGGCTAGATAGCCTGCTGTAAAAGAAAGAATAGAAAGAGTTAATCCAAGGCCTGCTGCAAAGAAAGAACAAGCTGAGCCAGCAGCAGCTAAGGTAAGAGCAGCATCTCGAGACTTAGAAAAATATAGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTAGCTAGAAGCACAAGAGGAAGAAGAAGTAGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTAAATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTAGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGAAATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATAGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA -MK114856.1,tat_exon2,8102,8198,8376,8469,forward,0.7134052388289676,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED**,AGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGA -MK114856.1,rev_exon2,8103,8379,8377,8653,forward,0.6888374145157732,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*,GACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAG +MK114856.1,vpr,5033,5579,5558,5849,forward,0.7334692430420138,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*,ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAG +MK114856.1,tat_exon1,5486,5780,5829,6045,forward,0.7619181418001311,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN,ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT +MK114856.1,rev_exon1,5698,5779,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAA +MK114856.1,vpu,5790,6039,6060,6309,forward,0.7407973896196594,MQPLKILAIVALVVAAIIAIVV,MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*,ATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAG +MK114856.1,env,5953,8521,6223,8794,forward,0.7529994904340572,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*,ATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTAGAAAAATAACATGGTAGACCAGATGCATGAGGATATAATCAATTTATGAGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAAAAATAATACTGTAGGAAATCAAACAAATTATCATCTCAATGAAACTAATACAATACAAAGAAAAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAATATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAAAGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTAGTTTTGCAATTCTAAAGTGTAAAGATGAGATGTTCAATAGAACAAGACCATGTAAGAATGTCAGCACAGTACAATGTACACATAGAATTAGACCAGTAGTGTCAACTCAACTGCTGTTAAATAGTAGCCTAGCAGAAAAAAAGATAGTACTTAGATCTGAAAATTTCACAGACAATACTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAAAGAGAGCAATTTATGCAACAAGACAGATAATAGAAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGAAGTGACACTTTAAGCAAAATAGTTGAAAAATTAAAGGAAAAATTTAGAAAAAATAAAACAATAATCTTTAAGCAATCATCAAGAGAGGACATAGAAATTGAAACGCACAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGAAGTGTTAATAGAACTAGCATAAACAGAACTAACAATAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATCAACAGGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCTATCAGTAAGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATAGTAGTACAACTAATAGTAAAGAAGAGACCTTCAGACCTAGAGAAAGAAATATGAAGGACAATTAGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAAAAGTAGCACCCACCAAGGCACAAAGAAAAGTAGTGCAGAGAGAAAAAAGAGCAATAAGAACGTTAGGAGCTATGTTCCTCAGGTTCTTAAGAACAGCAGGAAGCACTATAGGCGCAGCGTCACTGACGCTGACAGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTAAGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTAGAAAGATACCTACAAGATCAACAGCTCCTGAAGATTTGAAGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATACTAGTTAGAGCAATAAATCTTACAGTACCATCTAAGATAACATGACCTAGATGCAGTAGGACAGAGAAATTCAAAATTACACAAAGATAATATACAACTTACTTAAAGAATCGCAAATCCAACAGAAAAAGAATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAA +MK114856.1,nef,7916,9176,8795,9416,forward,0.7587548638132295,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MKKNY*N*INEQICRISLV*QNGYSI*KYS****EA**V*K*FLLYFL**IELGKDTHHYHCRPSSQPQEDQTGPKE*KKKVKRETEADPED**LDSYHSSKTTCKACAFSATTT*KTYS*LC*RLCKF*DTRSKRSSSTSRVSCSIKFRN*RIVLLACSIP*LSQ*LKEQIKL*K*DKKLAELFSTYLER*DKA*KRLCNKISGK*SKSCMAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAAAATAAGTGGCAAGTAGTCAAAAAGTTGTATGGCTAGATAGCCTGCTGTAAAAGAAAGAATAGAAAGAGTTAATCCAAGGCCTGCTGCAAAGAAAGAACAAGCTGAGCCAGCAGCAGCTAAGGTAAGAGCAGCATCTCGAGACTTAGAAAAATATAGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTAGCTAGAAGCACAAGAGGAAGAAGAAGTAGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTAAATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTAGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGAAATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATAGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MK114856.1,tat_exon2,8102,8198,8375,8471,forward,0.7134052388289676,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED**,AGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGA +MK114856.1,rev_exon2,8103,8379,8376,8652,forward,0.6888374145157732,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*,GACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAG MK115009.1,gag,302,1715,789,2292,forward,0.7484174646972894,MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC,MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*,ATGGGTGCTAGAGCGTCAGTATTAAGCGGCGGAAAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGAAGGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATAGTACATCAACCATTATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAAGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATAGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAAGAACCAAGAGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAAGGCTAAACAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAAGAACCCTTTAAAGATTATGTAGACCGATTCTATAAAACTCTAAAGGCTGAGCAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAAGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATAGTGCAAGGAGGCAATTTTAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAAGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAAAAATGTAGAAAGGAAAGACACCAAATGAAAGATTGTACTAAGAGACCAGACTAAGACGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGA MK115009.1,pol,1613,4625,2084,5096,forward,0.7535201229073285,AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGAGGAAGAGGCAACAGCTCCTCCTCAGAAGCAGGAGACGAAAGACCAAGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATGATAAAAAGAATTAGAAGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACGCCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGTCAGGAATAGATAGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAGGAAAAGAAAATTACAAAAATTAGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAAAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTAAGAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGAAGTTAAATATCAGTACAATGTGCTTCCACAGAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAGGTGAGGACTCACCACACCAGACAAGAAACATCAGAAAAAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTGATAAATAGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTGAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGAGGAGAGACCAATAGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGAAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAGAAAATGTGGTGGACAAAGTATTGGCAAGCCACCTAGATTCCTGAGTAAGAATTTGTCAATACCCCTCCCTTAGTAAAACTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAAATAAGGCAGCTAATAGAAAGACTAAATTAAGAAAAGCAGAGTATGTTACGGACAGAAGAAGACAAAAGGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAGATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTGAAGGAAATGAACAAGTAGATAAATTAGTCAGTAATAGAATCAGAAGAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAGAGAGCAATGGCTAGTAATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATAGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATAGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAAGCCGCCTGTTAGTAGGCAGAGATCAAGCAGGAATTTAGTATTCCCTACAATCCTCAAAGTCAAAGAGTAGTAAAATCTATGAATAATAAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115009.1,vif,4289,4988,5040,5619,forward,0.7624714704923379,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL*KP*SKNKFRSTHPIRGSKIGNKNILRSAYRRKRLAFRPGSIHRMEEKEI*HTSRPWPGRPTNSPVLF*LFFRICYKECHIRT*S*S*V*ISGRT*,ATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATAGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATAGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGAGGAAGCAAGATTGGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAA -MK115009.1,vpr,5087,5249,5558,5843,forward,0.6703246973639554,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAG -MK115009.1,tat_exon1,5235,5577,5830,6046,forward,0.6325105553751218,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115009.1,rev_exon1,5497,5578,5969,6047,forward,0.564475664826894,MAGRSRDSDEELLTAVRIIKRLYQSSK,MAGRSRDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115009.1,vpu,5589,5835,6259,6310,forward,0.7710195148641255,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*,ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG -MK115009.1,env,5752,8353,6224,8795,forward,0.7518870380010406,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATAAAGTACCTGTATAGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTAGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTAGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAACTTGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATGAAAGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTAATGTAGTACCAATAGATGAAGATAGTAAAAATACTACGGGCAAATATAAGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTAAACGGCAGTCTAGCAGAAGAAAAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATAGAACAGACATAATAAGAGATATAAGACAAGCGCATTATAACATTAGTAAGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGAAGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAGTACTTAGAATAGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAAGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTAGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTAGAGGAAGAGATATGAAGGACAATTAGAGAAGTAAATTATATAAATATAAAGTAGTCAAAATTAAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAAGGAAAAAAGAGCAATAAGACTTGAAGCTTTCTTCCTTAGGTTCTTAAGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACAGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAAAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTAAGGATTTAAAGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAAGAAAAAGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA -MK115009.1,nef,7748,8996,8796,9417,forward,0.7344808947652905,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MNKTYWH*ISRQVCKISLTLHSSYSI*KYS****EA**V*E*FLLYCL**IKLGKDTHHCHCRPSSQPREDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*KTYS*LRREL*NF*DAESKKH*SISRISCSIRVRK*RIVQLACSTPQQ*Q*LRGQIKL*KYYKEALELFSTYLHE*DRA*KRLCYKIGNKLSRRLKARWPAIKEKIRRARPVREPEPATAKVRAASRDLKRHGALTSSNTAATNADVACLEAQQKKEEVSFPVRPQVPLRPMTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*,ATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAAGGCTAGATGGCCTGCCATAAAGGAGAAAATAAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAACAGCTAAGGTAAGAGCAGCATCTCGAGACCTGAAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGAAGAAAGAAGAGGTAAGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115009.1,tat_exon2,7934,8027,8376,8469,forward,0.5633802816901408,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAG -MK115009.1,rev_exon2,7935,8211,8377,8653,forward,0.6781884553958476,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115009.1,vpr,5087,5378,5558,5849,forward,0.6737199868435482,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG +MK115009.1,tat_exon1,5235,5577,5829,6045,forward,0.6325105553751218,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115009.1,rev_exon1,5497,5578,5968,6046,forward,0.564475664826894,MAGRSRDSDEELLTAVRIIKRLYQSSK,MAGRSRDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK115009.1,vpu,5589,5835,6060,6309,forward,0.6256860592755216,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*,ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG +MK115009.1,env,5752,8353,6223,8794,forward,0.7518870380010406,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATAAAGTACCTGTATAGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTAGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTAGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAACTTGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATGAAAGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTAATGTAGTACCAATAGATGAAGATAGTAAAAATACTACGGGCAAATATAAGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTAAACGGCAGTCTAGCAGAAGAAAAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATAGAACAGACATAATAAGAGATATAAGACAAGCGCATTATAACATTAGTAAGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGAAGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAGTACTTAGAATAGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAAGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTAGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTAGAGGAAGAGATATGAAGGACAATTAGAGAAGTAAATTATATAAATATAAAGTAGTCAAAATTAAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAAGGAAAAAAGAGCAATAAGACTTGAAGCTTTCTTCCTTAGGTTCTTAAGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACAGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAAAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTAAGGATTTAAAGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAAGAAAAAGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA +MK115009.1,nef,7748,8996,8795,9416,forward,0.7328145265888457,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MNKTYWH*ISRQVCKISLTLHSSYSI*KYS****EA**V*E*FLLYCL**IKLGKDTHHCHCRPSSQPREDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*KTYS*LRREL*NF*DAESKKH*SISRISCSIRVRK*RIVQLACSTPQQ*Q*LRGQIKL*KYYKEALELFSTYLHE*DRA*KRLCYKIGNKLSRRLKARWPAIKEKIRRARPVREPEPATAKVRAASRDLKRHGALTSSNTAATNADVACLEAQQKKEEVSFPVRPQVPLRPMTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*,ATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAAGGCTAGATGGCCTGCCATAAAGGAGAAAATAAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAACAGCTAAGGTAAGAGCAGCATCTCGAGACCTGAAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGAAGAAAGAAGAGGTAAGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115009.1,tat_exon2,7934,8027,8375,8471,forward,0.5633802816901408,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAG +MK115009.1,rev_exon2,7935,8211,8376,8652,forward,0.6781884553958476,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG MK115387.1,gag,292,1795,789,2292,forward,0.25442849599155104,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAGGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACACAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAAGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCGCAGGATGTAAAAAATTGGATGACAGAAACCTTATTGGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA MK115387.1,pol,1587,4599,2084,5096,forward,0.17509882471546434,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAGGGAAGATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAGAAATCAATAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAATAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATGGATGACTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTGGGGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAGACAATTATGTAAACTCCTTAAGGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGGGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGGGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATGGGATACCTGGTGGACAGAATATTGGCAAGCCACCTGGATTCCCGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAAAAAGAACCTATTGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAGGAATAATTCAAGCACAACCAGATAGGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAGGGTCTACCTTGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTCCTATTTTTGGATGGAATAGATAAGGCCCAAGAGGAGCATGAGAAATATCACAATAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAGGGAGAAGCCACGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTGGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115387.1,vif,4543,5122,5040,5619,forward,0.34158090650317496,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAGGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGCAGGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAG -MK115387.1,vpr,5061,5352,5558,5843,forward,0.5625083211290105,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115387.1,tat_exon1,5332,5551,5830,6046,forward,0.37688442211055273,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA -MK115387.1,rev_exon1,5471,5552,5969,6047,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG -MK115387.1,env,5726,8288,6224,8795,forward,0.52645935624659,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115387.1,vpu,5770,5809,6259,6310,forward,0.5690703735881842,MGHHAPWNVDDL,MGHHAPWNVDDL*,ATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG -MK115387.1,tat_exon2,7869,7965,8376,8469,forward,0.6995153473344102,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA -MK115387.1,rev_exon2,7870,8146,8377,8653,forward,0.32366339007432277,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAG -MK115387.1,nef,8289,8940,8796,9417,forward,0.46946145391741245,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA +MK115387.1,vpr,5061,5352,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115387.1,tat_exon1,5332,5551,5829,6045,forward,0.37688442211055273,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA +MK115387.1,rev_exon1,5471,5552,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG +MK115387.1,vpu,5563,5809,6060,6309,forward,0.5560235888795282,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*,ATGCAATCCTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTGGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAGGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG +MK115387.1,env,5726,8288,6223,8794,forward,0.5276672448389619,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115387.1,tat_exon2,7869,7965,8375,8471,forward,0.6995153473344102,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115387.1,rev_exon2,7870,8146,8376,8652,forward,0.32366339007432277,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAG +MK115387.1,nef,8289,8940,8795,9416,forward,0.4631394979345408,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA MK115491.1,gag,521,2021,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115491.1,pol,1813,4825,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115491.1,vif,4769,5348,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115491.1,vpr,5287,5578,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115491.1,tat_exon1,5558,5777,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115491.1,rev_exon1,5697,5778,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115491.1,env,5952,8493,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115491.1,vpu,5990,6035,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115491.1,tat_exon2,8074,8170,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115491.1,rev_exon2,8075,8351,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115491.1,nef,8494,9109,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115491.1,vpr,5287,5578,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115491.1,tat_exon1,5558,5777,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115491.1,rev_exon1,5697,5778,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115491.1,vpu,5789,6035,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115491.1,env,5952,8493,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115491.1,tat_exon2,8074,8170,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115491.1,rev_exon2,8075,8351,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115491.1,nef,8494,9109,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK116110.1,gag,62,1601,140,1643,forward,0.7362754920106639,MSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ,MAGSPHSLTCCHHFF*CSCWSQCF*NSLTIWVCILDQQGFCHPIFYIL*SLLGS*GFIEPVYIVSKGFLWSLFYVQNADRTIHSYYFI*SQDYPSFIDISYWDRWIICHPSYLFLKGTSSSCYITSPWFSHLAWCNRPCMHWMQSIPFCSFLIDGLF*YLHCCLMSPHCI*HGVYILWGGSFC*C*KHRYYFWAKSLFFYYFYPCI*SSR*HGLMYHLPLEVLHYRVVLADLAVISCASCCLLCFHLAFVLLFLYLI*RSLGVLYLYPLMYTIEDRYCII**FKLF*PCLEGWL*LSQYLSTAF*CF*QARINCESF*LPACPY*MF*PIFFLSSWP*PNFFPLV*FSPA*Y*RSRTHLSPSSLR*VKTFLAYSPVAEAMSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ*,ATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCTGGTCCCAATGCTTTTAAAATAGTCTTACAATCTGGGTTTGCATTTTGGACCAACAAGGTTTCTGTCATCCAATTTTTTACATCCTGTGAAGCTTGCTCGGCTCTTAGGGTTTTATAGAACCGGTCTACATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTTTTATGTCCAAAATGCTGACAGGACTATACATTCTTACTATTTTATTTAATCCCAGGATTACCCATCTTTTATAGATATCTCCTACTGGGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTGCTATATCACTTCCCCTTGGTTCTCTCATTTGGCCTGGTGCAACAGGCCCTGCATGCACTGGATGCAATCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAATATTTGCATTGCTGCTTGATGTCCCCCCACTGTATTTAGCATGGTGTTTATATCTTGTGGGGTGGCTCCTTCTGCTAATGCTGAAAACATAGGTATTACTTCTGGGCTAAAAGCCTTTTCTTCTACTACTTTTACCCATGCATTTAAAGTTCTAGGTGACATGGCCTGATGTACCATTTGCCCCTGGAGGTTTTGCACTATAGGGTAGTTTTGGCTGACCTGGCTGTTATTTCCTGCGCCAGCTGCTGCTTGCTGTGCTTTCATCTTGCTTTTGTTTTGCTCTTCCTCTATCTTATCTAGCGCTCCCTTGGTGTCTTGTATCTCTATCCTTTGATGTATACAATAGAGGACCGCTACTGTATTATATAATGATTTAAGCTCTTCTGACCCTGTTTGGAGGGATGGCTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTGCCCATACTAGATGTTTTAACCTATATTTTTTCTTTCCTCCTGGCCTTAACCGAATTTTTTCCCATTGGTCTAATTTTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGGTAAAAACTTTTTTGGCGTACTCACCAGTCGCCGAAGCAATGAGCCAAGTAAATTCAACTACCGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAAGAAGACTGTTAAGTGTTTCAACTGTGGTAAAATAGGGCATATAGCAAAAAATTGCAGGGCCCCCAGGAGAAAGGGCTGTTGGAAATGTGGACAGGAAGGACACCAGATGAAAGATTGTAGTGAGAGACAGGCTAATTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAA MK116110.1,pol,1393,4405,1435,4447,forward,0.2475474244944199,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED*,TTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAAAAGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGTGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGATCAGATACCCATAGAAATCTATGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATTTGTTGACTCAGATTGGGTGCACTTTAAATTTTCCCATTAGTCCTATCGAAACTGTACCAGTAAGATTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAGATTTCAAAGATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAGAGAACTCAAGATTTCTGGGAAGTTCAATTGGGAATACCGCATCCCGCAGGATTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCATTAGATAAAGACTTTAGGAAGTATACTGCATTTACCATACCCAGTGTAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAGCTAGCATGACAAAAATTTTAGAGCCTTTTAGGAAGCAAAATCCAGACATGGTTATTTATCAATACATGGATGATCTATATATAGGATCTGACTTGGAATTAGGACAGCATAGGACAAAAATAGAGGAACTGAGACAACATCTATTGAGGTGGGGGTTTACCACACCAGACAAGAAGCATCAGAAAGAACCTCCATTCCTCTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAACACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTAGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAGGCAGTTATGTAAACTCCTTAGAGGAACCAAATCACTAACAGAAGTAGTACCACTAACAAGAGAGGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAATTACAAAAGCAGGGACAAGGCCAGTGGACTTATCAGATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATAAAGGGTACCCACACTAATGATGTAAAACAATTAACACAGGCTGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGACCCCATAGTAGGAGCAGAAACATTCTATGTCGATGGGGCAGCCAATAGGGATACTAAATTAGGAAAAGCAGGATATGTTACTGACAGGGGAAGACAAAAAATTGTCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTTACCTAGCTCTGCAGGATTCAGGATCAGAAGTAAACATAGTATCAGACTCACAGTATGCAATAGGAATTCTTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGACATGGGTGCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTATTATTCTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCCATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGTTAAAAGGAGAAGCCATACATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTGGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTGGCCAGTGGATATATTGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATATTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAACACAATACATACAGACAATGGCAGCAACTTCACTAGCACTGCGGTTAAAGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGGGATCAAGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGAGGTACAGTGCAGGGGAAAGAATAGTAGACATGATAGCATCAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGACTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAA MK116110.1,vif,4349,4928,4391,4970,forward,0.4686663095875737,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAATGCATGGAAAAGCTTAGTAAAGCACCATATGCATGTTTCAAGGAAAGTTGAGAGATGGGTTTATAAACATCACTATGAAAGTACTAATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAAAAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAAGAGCTATAATACACAAGTAGACCCTGAAGTAGCAGACCAACTAATCCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAAAGCCATAGTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCCCTACAGTACTTGGCATTAGCAGCATTAGTAAAATCAAAAAAGACAAAGCCACCTTTGCCTAGCGTTACGAAGCTGACGGAGGATAGATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAG @@ -233,168 +233,168 @@ MK116110.1,nef,8074,8695,8125,8752,forward,0.437094682230869,MGGKWSKSSVVGWPAVRER MK115527.1,gag,683,2183,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115527.1,pol,1975,4987,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115527.1,vif,4931,5510,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115527.1,vpr,5449,5740,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115527.1,tat_exon1,5720,5939,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115527.1,rev_exon1,5859,5940,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115527.1,env,6114,8655,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115527.1,vpu,6152,6197,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115527.1,tat_exon2,8236,8332,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115527.1,rev_exon2,8237,8513,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115527.1,nef,8656,9271,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115527.1,vpr,5449,5740,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115527.1,tat_exon1,5720,5939,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115527.1,rev_exon1,5859,5940,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115527.1,vpu,5951,6197,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115527.1,env,6114,8655,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115527.1,tat_exon2,8236,8332,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115527.1,rev_exon2,8237,8513,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115527.1,nef,8656,9271,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK114997.1,gag,210,1719,789,2292,forward,0.27936962750716343,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACACAATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGCACTTTAAATGCATGGGTAAAAGTGATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGATCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCCTCCATAATGGCGCAAGGAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA MK114997.1,pol,1511,4523,2084,5096,forward,0.26443159013103534,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAGAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGACAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACCAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTCCATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTAACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCCGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK114997.1,vif,4467,5046,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTAGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCCTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK114997.1,env,4985,8207,6224,8795,forward,0.6663239775063792,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*LRALETSRKSTYDCL*QLLL*TVLLSLPSLLHHKRLRHLLWQEEAETATKSFSQQSESSSGSTRAVSITCNACLKNSSNSRISSSNNNSNSCVVYSINRI*ENFKTKENRQVN**NKRKSRRQWQ*K*RRPGGIISTCGDGASCSLGW**YVVPTTCGSQSIMGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAGTATTACATGTAATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK114997.1,vpr,4985,5276,5558,5843,forward,0.5793112277557293,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK114997.1,tat_exon1,5256,5475,5830,6046,forward,0.4691531785127845,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK114997.1,rev_exon1,5395,5476,5969,6047,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK114997.1,vpu,5694,5733,6259,6310,forward,0.6901936289818864,MGHLVPWDGDDM,MGHLVPWDGDDM*,ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK114997.1,tat_exon2,7788,7881,8376,8469,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK114997.1,rev_exon2,7789,8065,8377,8653,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK114997.1,nef,8208,8850,8796,9417,forward,0.5478186258332784,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGA +MK114997.1,env,4985,8207,6223,8794,forward,0.6657028690558922,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*LRALETSRKSTYDCL*QLLL*TVLLSLPSLLHHKRLRHLLWQEEAETATKSFSQQSESSSGSTRAVSITCNACLKNSSNSRISSSNNNSNSCVVYSINRI*ENFKTKENRQVN**NKRKSRRQWQ*K*RRPGGIISTCGDGASCSLGW**YVVPTTCGSQSIMGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAGTATTACATGTAATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK114997.1,vpr,4985,5276,5558,5849,forward,0.3120665742024965,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK114997.1,tat_exon1,5256,5475,5829,6045,forward,0.4691531785127845,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK114997.1,rev_exon1,5395,5476,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK114997.1,vpu,5487,5733,6060,6309,forward,0.5568484042553192,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK114997.1,tat_exon2,7788,7881,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK114997.1,rev_exon2,7789,8065,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK114997.1,nef,8208,8850,8795,9416,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGA MK115518.1,gag,739,2239,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115518.1,pol,2031,5043,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115518.1,vif,4987,5566,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115518.1,vpr,5505,5796,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115518.1,tat_exon1,5776,5995,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115518.1,rev_exon1,5915,5996,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115518.1,env,6170,8711,6224,8795,forward,0.45675101255163,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115518.1,vpu,6208,6253,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115518.1,tat_exon2,8292,8388,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115518.1,rev_exon2,8293,8569,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115518.1,nef,8712,9327,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115518.1,vpr,5505,5796,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115518.1,tat_exon1,5776,5995,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115518.1,rev_exon1,5915,5996,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115518.1,vpu,6007,6253,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115518.1,env,6170,8711,6223,8794,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115518.1,tat_exon2,8292,8388,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115518.1,rev_exon2,8293,8569,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115518.1,nef,8712,9327,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115065.1,gag,221,1730,789,2292,forward,0.2880084183556756,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCCAAGGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGCTGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA MK115065.1,pol,1522,4534,2084,5096,forward,0.25117173416656646,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGATTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTATCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAAATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCTATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAGTGGAATCAGAAAAGTACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115065.1,vif,4478,5057,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK115065.1,vpr,4996,5287,5558,5843,forward,0.5872377841979652,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115065.1,tat_exon1,5267,5486,5830,6046,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115065.1,rev_exon1,5406,5487,5969,6047,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115065.1,env,5661,8262,6224,8795,forward,0.5065440396179699,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115065.1,vpu,5705,5744,6259,6310,forward,0.6901936289818864,MGHLVPWDGDDM,MGHLVPWDGDDM*,ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK115065.1,tat_exon2,7843,7936,8376,8469,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK115065.1,rev_exon2,7844,8120,8377,8653,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK115065.1,nef,8263,8905,8796,9417,forward,0.5386842636859471,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115065.1,vpr,4996,5287,5558,5849,forward,0.3351206434316354,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115065.1,tat_exon1,5267,5486,5829,6045,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115065.1,rev_exon1,5406,5487,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK115065.1,vpu,5498,5744,6060,6309,forward,0.5568484042553192,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115065.1,env,5661,8262,6223,8794,forward,0.5052314240113498,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115065.1,tat_exon2,7843,7936,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115065.1,rev_exon2,7844,8120,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115065.1,nef,8263,8905,8795,9416,forward,0.5339772804571117,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA MK115464.1,gag,527,2297,789,2292,forward,0.706855791962175,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGCTTCAGGCCATCCCTGGTTTGAGGGTGGGTCCCGCCGGGTCCCACCCCTTTGCACTCACGAGCCTGTCTGCCTCCTGCTGCCATCAATCACAGAGCCCAGGCTGTTCGGGCGCCACTGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGAGGCGGCGACTGGTGAGTACGCCAATTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAAGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAAGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACAAAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATAGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATAAGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATAGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCACAGGATGTAAAAAATTAGATGACAGAAACCTTATTAGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTAAGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAAGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA MK115464.1,pol,2089,5101,2084,5096,forward,0.7518376924488996,AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED,FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATAAGTTTGCCAGGAAGATAGAAACCAAAAATGATAGAAGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATAACTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTAGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAACCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAAAAAAGATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAGAAAATTAGTAGATTTCAAGGAACTTAATAAAAGAACTCAAGACTTCTAAGAAGTTCAATTAAGAATACCACACCCCGCAAGGTTAAAAAAGAAGAAATCAATAACAGTACTAGATGTAGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAAGAAGTATACTGCATTTACCATACCTAGTATAAATAATAAGACACCAGAGATTAGATATCAGTACAATGTGCTTCCACAGGGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATAGATGACTTGTATGTAAGATCTGACTTAGAAATAAGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTAGAGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATAAGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTAAGAAAATTGAATTGAGCAAGTCAGATTTATGCAGAGATTAAAGTGAGACAATTATGTAAACTCCTTAAAGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAAGAAATTCTAAAAGAACCAGTACATGAAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGAGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGAGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGAGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATAAGATACCTAGTGGACAGAATATTGGCAAGCCACCTAGATTCCCGAGTAAGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATAGTACCAATTAGAAAAAGAGCCTATTGTAGGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAAAGAGACTAAATTAAGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAAGAATAATTCAAGCACAACCAGATAAGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTACCTTGCATAGGTACCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTGCTAGAATCAGGAAAGTCCTATTTTTAGATAGAATAGATAAGGCCCAAGAAGAGCATAAGAAATATCACAATAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAAAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAAAAAGAAGCCACGCATAGACAAGTAGACTGTAGTCCAAGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTAGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTAGTAGGCAAAGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAAGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115464.1,vif,5045,5624,5040,5619,forward,0.7067546928117459,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAAGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTAGGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGTCAAGGAGTCTCCATAGAATGGAAGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAG -MK115464.1,vpr,5563,5854,5558,5843,forward,0.5898566703417862,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG -MK115464.1,tat_exon1,5563,6052,5830,6046,forward,0.7571801566579635,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*IRALEASRKSA*DSLYQMLL*KMLLSLPSLFHNKRLRHLLWQEEAETATKTSSRQSDSSSTSTKAV,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTG -MK115464.1,rev_exon1,5973,6054,5969,6047,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG -MK115464.1,env,6228,8799,6224,8795,forward,0.7471048806788873,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA -MK115464.1,vpu,6228,6276,6259,6310,forward,0.7611885546588408,MRVKEIKRSYQHL,MRVKEIKRSYQHL*R*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAG -MK115464.1,nef,8194,9451,8796,9417,forward,0.6542937183493158,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MNKNYWH*INRQVCRISLTYHNGCGI*KYS****EA**V*E*FLLYFL**IKLGKDTHHYHFRPSSQPREEPTGPKE*KKEVERETKADPVD**TDS*HLSRTIYGAYASSATTA*ATYS*L*SRLWNF*DARGKKPSNISRISCSTRVRN*RIVLSACSTPQL***LKGQIR**KYYKELVELFSTYLGE*DRA*KRLCYKIGGKWSKSSKVK*NAVKERIRRAQPTADKERAEPAADKVRAASRDLEKYGALTSKNTAATNADCAWLEAQEEEDEVGFPVRPQLPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAGTAAGGTTAAATAGAATGCAGTGAAAGAAAGAATAAGACGAGCTCAGCCAACAGCAGATAAAGAACGAGCTGAGCCAGCAGCAGATAAGGTAAGAGCAGCATCTAGAGACCTAGAAAAATATGGAGCACTTACAAGTAAGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGATGAGGTAGGTTTTCCAGTCAGACCTCAGTTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA -MK115464.1,tat_exon2,8380,8476,8376,8469,forward,0.6995153473344102,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA -MK115464.1,rev_exon2,8381,8657,8377,8653,forward,0.5716671727907683,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAG +MK115464.1,vpr,5563,5854,5558,5849,forward,0.37688442211055273,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG +MK115464.1,tat_exon1,5563,6052,5829,6045,forward,0.7571801566579635,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*IRALEASRKSA*DSLYQMLL*KMLLSLPSLFHNKRLRHLLWQEEAETATKTSSRQSDSSSTSTKAV,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTG +MK115464.1,rev_exon1,5973,6054,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG +MK115464.1,vpu,6065,6311,6060,6309,forward,0.7521692502681095,MQSLYILTIVALVVAAILAIVV,MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*,ATGCAATCTTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTAGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAAGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAG +MK115464.1,env,6228,8799,6223,8794,forward,0.7471048806788873,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA +MK115464.1,nef,8194,9451,8795,9416,forward,0.6514772974147296,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MNKNYWH*INRQVCRISLTYHNGCGI*KYS****EA**V*E*FLLYFL**IKLGKDTHHYHFRPSSQPREEPTGPKE*KKEVERETKADPVD**TDS*HLSRTIYGAYASSATTA*ATYS*L*SRLWNF*DARGKKPSNISRISCSTRVRN*RIVLSACSTPQL***LKGQIR**KYYKELVELFSTYLGE*DRA*KRLCYKIGGKWSKSSKVK*NAVKERIRRAQPTADKERAEPAADKVRAASRDLEKYGALTSKNTAATNADCAWLEAQEEEDEVGFPVRPQLPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAGTAAGGTTAAATAGAATGCAGTGAAAGAAAGAATAAGACGAGCTCAGCCAACAGCAGATAAAGAACGAGCTGAGCCAGCAGCAGATAAGGTAAGAGCAGCATCTAGAGACCTAGAAAAATATGGAGCACTTACAAGTAAGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGATGAGGTAGGTTTTCCAGTCAGACCTCAGTTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA +MK115464.1,tat_exon2,8380,8476,8375,8471,forward,0.6995153473344102,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115464.1,rev_exon2,8381,8657,8376,8652,forward,0.5716671727907683,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAG MK115530.1,gag,746,2246,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115530.1,pol,2038,5050,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115530.1,vif,4994,5573,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115530.1,vpr,5512,5803,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115530.1,tat_exon1,5783,6002,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115530.1,rev_exon1,5922,6003,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115530.1,env,6177,8718,6224,8795,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115530.1,vpu,6215,6260,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115530.1,tat_exon2,8299,8395,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115530.1,rev_exon2,8300,8576,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115530.1,nef,8719,9334,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115530.1,vpr,5512,5803,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115530.1,tat_exon1,5783,6002,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115530.1,rev_exon1,5922,6003,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115530.1,vpu,6014,6260,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115530.1,env,6177,8718,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115530.1,tat_exon2,8299,8395,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115530.1,rev_exon2,8300,8576,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115530.1,nef,8719,9334,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115520.1,gag,695,2195,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115520.1,pol,1986,5004,2084,5096,forward,0.6033592883813991,YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,IF*GKSGLPTKEGQGTSFRADQSQQPHQKRASGLGKRQ*LPLRSRSQETRNCIPCLPSNHSLAATPRQNKNRGAI*RSFLRYRSR*YSIRRNEFARKMETKNDRGNWRFYQSKTV*SDTHRNLWTQSYRYSINRTYTCQHNWKKSVDSAWLYLKFSH*SY*NCTSKIKARNGWPKS*TMAIDRRKNKSISRNLYRNGKGRKNFKNWA*KSIQYSSICYKEKRQY*MEKISRFQRTQ*ENSRLLGSSIRNTTSCRVKKEKISNSTGCG*CIFFNSLR*RIQEVYCIYHT*YK**DTRD*V*VQCAATGMERITSNIPK*HDKNLRAF*KAKSRYSYLSIHG*FVCRI*LRNRAA*NKNRGTKTTSVKVGTYHTRQKTSERTSIPLDGL*TPS*YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,ATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATATGGGAAATGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115520.1,vif,4948,5527,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115520.1,vpr,5466,5757,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115520.1,tat_exon1,5737,5956,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115520.1,rev_exon1,5876,5957,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115520.1,env,6131,8672,6224,8795,forward,0.4569687738004571,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115520.1,vpu,6169,6214,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115520.1,tat_exon2,8253,8349,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115520.1,rev_exon2,8254,8530,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115520.1,nef,8673,9288,8796,9417,forward,0.4756067663643049,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115520.1,vpr,5466,5757,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115520.1,tat_exon1,5737,5956,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115520.1,rev_exon1,5876,5957,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115520.1,vpu,5968,6214,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115520.1,env,6131,8672,6223,8794,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115520.1,tat_exon2,8253,8349,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115520.1,rev_exon2,8254,8530,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115520.1,nef,8673,9288,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115503.1,gag,817,2317,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115503.1,pol,2109,5121,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115503.1,vif,5065,5644,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115503.1,vpr,5583,5874,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115503.1,tat_exon1,5854,6073,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115503.1,rev_exon1,5993,6074,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115503.1,env,6248,8789,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115503.1,vpu,6286,6331,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115503.1,tat_exon2,8370,8466,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115503.1,rev_exon2,8371,8647,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115503.1,nef,8790,9405,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115503.1,vpr,5583,5874,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115503.1,tat_exon1,5854,6073,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115503.1,rev_exon1,5993,6074,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115503.1,vpu,6085,6331,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115503.1,env,6248,8789,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115503.1,tat_exon2,8370,8466,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115503.1,rev_exon2,8371,8647,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115503.1,nef,8790,9405,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115570.1,gag,687,2187,789,2292,forward,0.2967573174581697,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCGACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115570.1,pol,1979,4991,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115570.1,vif,4935,5514,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115570.1,vpr,5453,5744,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115570.1,tat_exon1,5724,5943,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115570.1,rev_exon1,5863,5944,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115570.1,env,6118,8659,6224,8795,forward,0.4604674291397314,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115570.1,vpu,6156,6201,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115570.1,tat_exon2,8240,8336,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115570.1,rev_exon2,8241,8517,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115570.1,nef,8660,9275,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115570.1,vpr,5453,5744,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115570.1,tat_exon1,5724,5943,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115570.1,rev_exon1,5863,5944,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115570.1,vpu,5955,6201,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115570.1,env,6118,8659,6223,8794,forward,0.4620723847297967,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115570.1,tat_exon2,8240,8336,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115570.1,rev_exon2,8241,8517,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115570.1,nef,8660,9275,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115509.1,gag,555,2055,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115509.1,pol,1847,4859,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115509.1,vif,4803,5382,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115509.1,vpr,5321,5612,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115509.1,tat_exon1,5592,5811,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115509.1,rev_exon1,5731,5812,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115509.1,env,5986,8527,6224,8795,forward,0.4564898680537425,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115509.1,vpu,6024,6069,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115509.1,tat_exon2,8108,8204,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115509.1,rev_exon2,8109,8385,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115509.1,nef,8528,9143,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115509.1,vpr,5321,5612,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115509.1,tat_exon1,5592,5811,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115509.1,rev_exon1,5731,5812,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115509.1,vpu,5823,6069,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115509.1,env,5986,8527,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115509.1,tat_exon2,8108,8204,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115509.1,rev_exon2,8109,8385,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115509.1,nef,8528,9143,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115702.1,gag,246,1782,789,2292,forward,0.35613851839948674,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGCGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAGGAAACGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGCTTCGCAGTCAACCCTGGCCTGTTAGAAACATCAGAAGGCTGCAAACAAATAATGGGACAACTCCAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAGAGGATAGATGTAAAGGATACCAAAGAAGCTTTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCCGCTGACACAGGAAACAACAGCCAAGTCAGCCAAAATTACCCCATAGTGCAGAACATGCAGGGACAAATGGTACATCAGGCCATATCACCCAGAACCCTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCATTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAGGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCAGGCAGGACCTGTTGCACCAGGCCAGATAAGGGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACACATAATCCACCCGTCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAGACTCTAAGAGCTGAGCAAGCTTCACAGGAAGTAAAAGGTTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCAGCCATAAGGCAAGGGTTTTGGCAGAAGCAATGAGCCAAGCAACAGGTGCACATGCCATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAA MK115702.1,pol,1544,4586,2084,5096,forward,0.24526399193257942,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAAAGATAGGGGGGCAAATAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGAAATGGCGTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATAGCCATAGAAATTTGTGGACATAAAGCAATTGGTACAGTATTAGTAGGACCTACACCTGTCAATATAATTGGAAGAAATCTATTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAGTTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATAGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAGTGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGATTAAAAAAGAAAAAATCAATAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGATGAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATATTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGACGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGAGGACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAGGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAGATGGACAGTACAGCCTATAAAGCTGCCAGAGAAAGAAATCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATTAAAGTAAAACAATTATGTAAACTCCTTAGGGGAACCAAAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGAATTAATAGCAGAAATACAGAAGCAAGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCGAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAGAAAATATCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAGGAAACATGGGAAATATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTTAGTACTCCTCCCCTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCATCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATATTACTGACAGAGGAAGACAAAAGGTTGTCACCCTAAATGACACAACCAATCAAAAGACAGAGTTACAAGCAATTCTTCTAGCATTGCAGGATTCAGGATTAGAAGCAAACATAGTGACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGATCTACCTGACATGGGTACCAGCACATAAAGGAATTGGAGGAAATGAGCAAGTAGATAAATTAGTCAGTACTGGGATTAGGAAAGTATTATTTTTAGATGGAATAGATAGGGCCCAAGAAGAGCATGAGAGATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTCAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAATAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACACTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTACCACAGTTAAGGCCGCCTGTTGGTGGGCGGGGGTCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTGGTAGAATCTATGAATAAAGAATTAAAGAAAATAATAGGACAGGTCAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTTCAAAAATTCAAAACTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCGGTAGTAATACAGGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115702.1,vif,4530,5109,5040,5619,forward,0.3566796368352788,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAAGAAAACTAAGGGATGGTTTTATAGACATCACTATGAGAGCACTCATCCAAAAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTGAGTTGGTAGTAACAACATATTGGGGTTTGCAGCCAGGGGAAAGGGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAGGGAGATATAGAACACACGTGGACCCTAACCTAGCAGACCAACTAATTCATCTGCATTACTTTGATTGTTTTTCAGAATCTGCTATAAGACATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAAGAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACTAAACTAACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG -MK115702.1,vpr,5048,5339,5558,5843,forward,0.5731147540983608,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAA -MK115702.1,tat_exon1,5319,5538,5830,6046,forward,0.5237430167597767,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ*,ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAA -MK115702.1,rev_exon1,5458,5539,5969,6047,forward,0.5622384937238494,MAGRSGDGDEDLLKAVRLIKTLYQSSK,MAGRSGDGDEDLLKAVRLIKTLYQSSK,ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAAG -MK115702.1,env,5716,8257,6224,8795,forward,0.5208458282639616,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*,ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA -MK115702.1,vpu,5760,5808,6259,6310,forward,0.70010183299389,MGHNAHHAPWDIND,MGHNAHHAPWDIND**,ATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA -MK115702.1,tat_exon2,7874,7970,8376,8469,forward,0.3921568627450981,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD**,AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA -MK115702.1,rev_exon2,7875,8151,8377,8653,forward,0.3471418653089562,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*,GACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAG -MK115702.1,nef,8275,8896,8796,9417,forward,0.47444962236863253,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*,ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA +MK115702.1,vpr,5048,5339,5558,5849,forward,0.3566796368352788,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAA +MK115702.1,tat_exon1,5319,5538,5829,6045,forward,0.5237430167597767,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ*,ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAA +MK115702.1,rev_exon1,5458,5539,5968,6046,forward,0.5622384937238494,MAGRSGDGDEDLLKAVRLIKTLYQSSK,MAGRSGDGDEDLLKAVRLIKTLYQSSK,ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAAG +MK115702.1,vpu,5550,5808,6060,6309,forward,0.6039004707464695,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**,ATGTTATCTTTAGAAGTAATAGTAGCAATAACAGCATTAGTAGTAGCAGGAATAATAGCAATAGTTGTGTGGACCATAGTACTTATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAAGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA +MK115702.1,env,5716,8257,6223,8794,forward,0.5196110433453024,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*,ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA +MK115702.1,tat_exon2,7874,7970,8375,8471,forward,0.32608695652173914,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD**,AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA +MK115702.1,rev_exon2,7875,8151,8376,8652,forward,0.3471418653089562,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*,GACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAG +MK115702.1,nef,8275,8896,8795,9416,forward,0.4680383864671438,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*,ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA MK115095.1,gag,2,1697,789,2292,forward,0.7478034493979825,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC,SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,TCTGGTTTCTCTTTCACTTTCAAGTCCCTGTTCGGGCGCCATCTAGGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCACGGCAAGAGGCGAGGCGCGGCGACTAGTGAGTACGCCGAAATTTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGGGAGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAAAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAACCCATATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAAGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAAGCTGCAGAATAAGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAGGAACCAAGAAGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATAGATAATCCTGAGGTTAAATAAAATAGTAAAAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAGGAACCCTTTAAGGATTATGTAGACCGGTTCTATAAAACTCTAAAGGCTGAACAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAAGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATGGTGCAAGGAGGCAATTTAAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAGAAATGTGGAAAGAAAGGACACCAAATGAAAGATTGTACTAAGAGACAGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA MK115095.1,pol,1489,4501,2084,5096,forward,0.7624366800883231,KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK,FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAAGAAGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAAAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATAATAGAAGGAATTAGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAAAAATTTGTAGACATAAAGCTATAAGTACAGTATTAATAAGACCTACACCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAAGAAAGGAAAATTACAAAAATTAGGCCTAAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATAGAGAAAATTAGTAGATTTCCGAGAACTTAATAAAAGAACACAAGACTTTTAAAAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAAGAGTTAGATATCAGTACAATGTGCTTCCACAAAGATAGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAAGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAAGTAAAGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTAAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAAGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAGGAGATTCTAAAAGAACCAGTACATAGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGAGGAGACCAATGGACATATCAAATTTATCAGAAGCCATTTAAAAATCTGAAAACAAAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATAGAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAAGAAATGTAGTAGACAGAGTATTGGCAAGCCACCTAGATTCCTGAGTAGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAGAGAGACTAAATTAAGAAAAGCAAGGTATGTTACGGACAGAAGAAGACAAAAAGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAAATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTAGTAGAATCAGAAAAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAAGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAGGCCGCCTGTTAGTAGGCAAGGATCAAGCAGAAATTTAGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAAGGGGGATTGGGGGGTACAGTGCAGAGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTAGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAG MK115095.1,vif,4445,5024,5040,5619,forward,0.7494633160752622,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGAGTTTACAGACATCACCATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAAGGGAAGCAAGATTAGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGGCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAG -MK115095.1,vpr,4963,5254,5558,5843,forward,0.6112852664576804,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAA -MK115095.1,tat_exon1,5111,5453,5830,6046,forward,0.6409453748630458,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MEILGQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPNLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAACTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCCATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115095.1,rev_exon1,5373,5454,5969,6047,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115095.1,vpu,5465,5711,6259,6310,forward,0.7683007254341614,MHALEIAAIVRLVVAAIIAIVV,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG -MK115095.1,env,5628,8229,6224,8795,forward,0.7513561129398668,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATGAGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAAGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATGAATTAAATCTAAATTGCCCTAACAATAATACTTGTAGTAATAATACTAAATATAATATGACGGAAGAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAAGTAGTGGAAATACTACAGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAAGGAGGGCATTTTATAGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTAGGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAAAGGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAAGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAATACTTAGAATGGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATAGTAAGAGCAACAATAGTAGTAATGATACAAAGACCTTCAGGCCTAGAAGAGGAGATATGAAGGACAATTAGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAGAAAGAAAAAAGAGCAATAGGACTTAGAGCTTTCTTCCTTAAGTTCTTAGGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTGAAGATTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTAATGTGCCCTAAAATGTTAGTTAGAGCCCTAGATAGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAGGAAAAAGAAATTGACAATTATACAGACACAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAA -MK115095.1,nef,7624,8872,8796,9417,forward,0.5872017754762344,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MNKTY*H*ISRQVCRISLTLHSGYSI*KYS****EA**V*E*FLLYCL**IELGRDTHHCHCRPSSQPRGDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*ETYS*LWRGL*NF*DAESKKH*SIGRISCSIRVRK*RIVQLACSTPQQ*Q*LKGQIRL*KYYKEALELFSTYLHE*DRA*KKLCYKIGNKLSRRLRARWPAIKERMRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAGGGCTAGATGGCCTGCCATAAAAGAAAGAATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115095.1,tat_exon2,7810,7903,8376,8469,forward,0.5303030303030303,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAG -MK115095.1,rev_exon2,7811,8087,8377,8653,forward,0.6667847862036381,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115095.1,vpr,4963,5254,5558,5849,forward,0.4464285714285715,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAA +MK115095.1,tat_exon1,5111,5453,5829,6045,forward,0.6409453748630458,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MEILGQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPNLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAACTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCCATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115095.1,rev_exon1,5373,5454,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK115095.1,vpu,5465,5711,6060,6309,forward,0.7521692502681095,MHALEIAAIVRLVVAAIIAIVV,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG +MK115095.1,env,5628,8229,6223,8794,forward,0.7513561129398668,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATGAGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAAGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATGAATTAAATCTAAATTGCCCTAACAATAATACTTGTAGTAATAATACTAAATATAATATGACGGAAGAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAAGTAGTGGAAATACTACAGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAAGGAGGGCATTTTATAGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTAGGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAAAGGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAAGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAATACTTAGAATGGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATAGTAAGAGCAACAATAGTAGTAATGATACAAAGACCTTCAGGCCTAGAAGAGGAGATATGAAGGACAATTAGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAGAAAGAAAAAAGAGCAATAGGACTTAGAGCTTTCTTCCTTAAGTTCTTAGGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTGAAGATTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTAATGTGCCCTAAAATGTTAGTTAGAGCCCTAGATAGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAGGAAAAAGAAATTGACAATTATACAGACACAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAA +MK115095.1,nef,7624,8872,8795,9416,forward,0.5833488893037148,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MNKTY*H*ISRQVCRISLTLHSGYSI*KYS****EA**V*E*FLLYCL**IELGRDTHHCHCRPSSQPRGDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*ETYS*LWRGL*NF*DAESKKH*SIGRISCSIRVRK*RIVQLACSTPQQ*Q*LKGQIRL*KYYKEALELFSTYLHE*DRA*KKLCYKIGNKLSRRLRARWPAIKERMRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAGGGCTAGATGGCCTGCCATAAAAGAAAGAATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115095.1,tat_exon2,7810,7903,8375,8471,forward,0.5303030303030303,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAG +MK115095.1,rev_exon2,7811,8087,8376,8652,forward,0.6667847862036381,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG MK115490.1,gag,549,2049,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115490.1,pol,1841,4853,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115490.1,vif,4797,5376,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115490.1,vpr,5315,5606,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115490.1,tat_exon1,5586,5805,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115490.1,rev_exon1,5725,5806,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115490.1,env,5980,8521,6224,8795,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115490.1,vpu,6018,6063,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115490.1,tat_exon2,8102,8198,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115490.1,rev_exon2,8103,8379,8377,8653,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115490.1,nef,8522,9137,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115490.1,vpr,5315,5606,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115490.1,tat_exon1,5586,5805,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115490.1,rev_exon1,5725,5806,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115490.1,vpu,5817,6063,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115490.1,env,5980,8521,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115490.1,tat_exon2,8102,8198,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115490.1,rev_exon2,8103,8379,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115490.1,nef,8522,9137,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA MK115576.1,gag,468,1968,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA MK115576.1,pol,1760,4772,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MK115576.1,vif,4716,5295,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115576.1,vpr,5234,5525,5558,5843,forward,0.5872120921305184,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115576.1,tat_exon1,5505,5724,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115576.1,rev_exon1,5644,5725,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115576.1,env,5899,8440,6224,8795,forward,0.45675101255163,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115576.1,vpu,5937,5982,6259,6310,forward,0.46723952738990326,MEMGHHAPGDVDDL,MEMGHHAPGDVDDL*,ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115576.1,tat_exon2,8021,8117,8376,8469,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115576.1,rev_exon2,8022,8298,8377,8653,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115576.1,nef,8441,9056,8796,9417,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115576.1,vpr,5234,5525,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115576.1,tat_exon1,5505,5724,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115576.1,rev_exon1,5644,5725,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115576.1,vpu,5736,5982,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115576.1,env,5899,8440,6223,8794,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115576.1,tat_exon2,8021,8117,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115576.1,rev_exon2,8022,8298,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115576.1,nef,8441,9056,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA OQ092466,gag,825,2361,789,2292,forward,0.2559303794507086,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTAGCCTGTTAGAAACAGCAGAAGGCTGTAGACAAATATTGGGACAGTTACAACCGTCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACATTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCCTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGCAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGCCAGGTTAGACACACAGGAAACAGCAGCCAGGTCAGCCAAAATTACCCTATAGTACAGAACCTTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGACTACATCCAGTGCATGCAGGGCCCATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTACACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGGGGACCCGGACATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCACGTAACAAATTCAAGTGCCATAATGATGCAGAGGGGCAATTTTAGAAACCAAAGAAAGGCTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA OQ092466,pol,2147,5165,2084,5096,forward,0.19193360134872262,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGGGCAGATGATACAGTATTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAGGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTATTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGTATGACAAAAATCTTAGAGCCTTATAGAACACGAAATCCAGAAATGGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGACTTAGAAATAGGGCAACATAGAGCAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGATTTACTACCCCAGACAAAAAACATCAAAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAAACAAAGACAGCTGGACTGTCAATGACATACAGAAACTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCGCTAACAGAAGAAGCAGAGTTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGGGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGGAAGGACAATGGACATTTCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGCGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAGGCATAGTAATATGGGGAAAAATTCCTAAATTTAGACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATACGCATTGGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTGATAAAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTGCTGGAATCAGGAAAGTATTATTTTTAGATGGAATAGAGAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGCTAAAAGGAGAAGCCATACATGGACAGGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATACGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATCCAAACCAAAGAACTACAAAAACAAATTATAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTTATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG OQ092466,vif,5109,5688,5040,5619,forward,0.24677296886864086,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAGGAAAGCTAAGGGATGGTTTTATAGACATCACTTTGAAAGCAATCATCCAAAAATAAGTTCAGAAGTACACATCCCACTGGAGGATGCTAGACTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGGGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTACTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACACATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGAGAAAGCCACCCTTGCCTAGTGTTAAGAAGCTAACAGAAGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -OQ092466,vpr,5627,5918,5558,5843,forward,0.5625083211290103,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -OQ092466,tat_exon1,5898,6117,5830,6046,forward,0.40192926045016075,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ*,ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAA -OQ092466,rev_exon1,6037,6118,5969,6047,forward,0.4807692307692307,MAGRSGDSDDELLKTVRLIKVLYQSSK,MAGRSGDSDDELLKTVRLIKVLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAAG -OQ092466,vpu,6129,6375,6259,6310,forward,0.7548091006737623,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*,ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA -OQ092466,env,6292,8875,6224,8795,forward,0.4841544358231281,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*,ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -OQ092466,tat_exon2,8456,8552,8376,8469,forward,0.5303030303030303,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH**,AGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGA -OQ092466,rev_exon2,8457,8733,8377,8653,forward,0.3690449563855961,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*,GATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAG -OQ092466,nef,8876,9509,8796,9417,forward,0.4195274186357557,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*,ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092466,vpr,5627,5918,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092466,tat_exon1,5898,6117,5829,6045,forward,0.40192926045016075,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ*,ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAA +OQ092466,rev_exon1,6037,6118,5968,6046,forward,0.4807692307692307,MAGRSGDSDDELLKTVRLIKVLYQSSK,MAGRSGDSDDELLKTVRLIKVLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAAG +OQ092466,vpu,6129,6375,6060,6309,forward,0.5077548005908421,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*,ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA +OQ092466,env,6292,8875,6223,8794,forward,0.48559709145147756,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*,ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092466,tat_exon2,8456,8552,8375,8471,forward,0.5303030303030303,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH**,AGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGA +OQ092466,rev_exon2,8457,8733,8376,8652,forward,0.3690449563855961,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*,GATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAG +OQ092466,nef,8876,9509,8795,9416,forward,0.411658382286489,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*,ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA OQ092463,gag,801,2313,140,1643,forward,0.2589641434262949,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAGCGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAACACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGACCAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTCAGGAACCAGAGAAAGAATGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA OQ092463,pol,2105,5117,1435,4447,forward,0.14797358397500882,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAGTCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAGCTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAGCAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCTATAGTAGGAGCAGAAACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGACCATGAGAAATATCACAGTAATTGGAGGGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGGTATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCAGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG OQ092463,vif,5061,5640,4391,4970,forward,0.32379004771642805,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTATTCATCCAAGAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAGGAGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATCGGTATTACTTTGATTGTTTTTCAGAATCTGCCATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG @@ -420,14 +420,14 @@ OQ092465,nef,8882,9515,8209,8842,forward,0.3463855421686747,MGGKWSKSSVVGWPKIRERM OQ092462,gag,767,2270,789,2292,forward,0.316486214000789,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAGCTAAAACATATAGTATGGGCAAGCAGGGAACTAGAGCGATTTGCAGTTAATCCCGGCCTGTTAGAAACATCGGAGGGCTGTAGACAAATACTAGGGCAACTACAGCCCGCTCTTCAGACAGGATCAGAAGAACTTAAATCACTATTTCATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTGAAAGACACCAAAGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAAGAAAAGTAAGAAAAAGGCACAGCAAGCAGCCGCTGACACAGGAAATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGACAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGATAAGGCTTTCAGTCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCAGGCAGGGCCTGTTGCGCCAGGCCAGCTACGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAGCAAATAGCATGGATGACACATAATCCACCTGTCCCAGTAGGAGAAATCTATAAAAGATGGATACTTCTGGGATTAAATAAAATAGTAAGAATGTACAGCCCCGTCAGCATTCTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCTGAGCAGGCTTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAGCAAATCCAGCTAGCATAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGCCTATTAAGTGTTTCAACTGTGGCAAAGAGGGGCATATTGCTAAAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA OQ092462,pol,2062,5074,2084,5096,forward,0.1943357603710517,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTTTTAGAAGAAATGAATTTGCCAGGAAAATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGCTGCACTTTAAATTTTCCCATTAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATCTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAGAAAGATGGTAATAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCTGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAGGACTTCAGGAAGTATACTGCATTTACAATACCTAGCACAAACAATGAGACACCAGGGATTAGATACCAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTGGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATTTATCAATACATGGATGATTTATATGTAGGGTCTGACTTAGAAATAGGGCAGCATAGAGCAAAAATAGAGGAACTGAGACAACATCTATTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCCGATAAATGGACAGTACAGCCTATATTGCTGCCAGAAAAAGACAGCTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATCAAAGTAAGGCAGCTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTGGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGATTTAATAGCAGAACTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATATAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGAGGTACCCACACTAATGATATAAAACAATTAACAGAGGCAGTGCAAAAAATAGCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAATTACCCATACAAAAGGAAACATGGGAAGCATGGTGGATAGAGTATTGGCAAGCCACCTGGATTCCTGAATGGGAGTTTGTCAATACCCCTCCCTTAGTGAAACTATGGTACCAGTTGGAAAAAGAACCCATAGTGGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAAACTAAATTAGGAAAAGCAGGATATGTTACTGACAAAGGAAGACAAAAAGTTGTCCCCCTAACGGACACAACAAATCAGAAGACTGAGCTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAACTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAGTTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTATAGTAGCAAAGGAAATAGTAGCCAGTTGTGACAAATGTCAGTTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCTGGAATATGGCAGCTAGATTGTACACATCTAAAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTGAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCTGCCTGTTGGTGGGCGGGGATCAAACAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCAGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCGTCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACCAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATCAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG OQ092462,vif,5018,5597,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAGAGTTTAGTAAAACATCATATGCATATATCAAGGAAAGCTAAGAATTGGTTGTATAGACATCACTATGAAAGCATTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAGTAATAACAACATATTGGGGTCTGCTTACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAGGAGATATAGAACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCTTATTAGGACGTGTAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACCAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAG -OQ092462,vpr,5536,5827,5558,5843,forward,0.5656050955414005,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAG -OQ092462,tat_exon1,5807,6026,5830,6046,forward,0.37688442211055273,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*,ATGGATCCAGTAGATCCTAGCCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGTTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAA -OQ092462,rev_exon1,5946,6027,5969,6047,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKFLYQSSK,MAGRSGDSDEELLKAVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAAG -OQ092462,vpu,6038,6284,6259,6310,forward,0.7548091006737623,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*,ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG -OQ092462,env,6201,8778,6224,8795,forward,0.5096088152339575,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -OQ092462,tat_exon2,8359,8455,8376,8469,forward,0.4542873367404884,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH**,AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA -OQ092462,rev_exon2,8360,8636,8377,8653,forward,0.38952607660679506,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*,GACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG -OQ092462,nef,8779,9406,8796,9417,forward,0.5105263157894737,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*,ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA +OQ092462,vpr,5536,5827,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAG +OQ092462,tat_exon1,5807,6026,5829,6045,forward,0.37688442211055273,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*,ATGGATCCAGTAGATCCTAGCCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGTTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAA +OQ092462,rev_exon1,5946,6027,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKFLYQSSK,MAGRSGDSDEELLKAVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAAG +OQ092462,vpu,6038,6284,6060,6309,forward,0.5464940306036659,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*,ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG +OQ092462,env,6201,8778,6223,8794,forward,0.5083167934238491,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092462,tat_exon2,8359,8455,8375,8471,forward,0.4034761018001243,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH**,AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA +OQ092462,rev_exon2,8360,8636,8376,8652,forward,0.38952607660679506,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*,GACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092462,nef,8779,9406,8795,9416,forward,0.5049429657794677,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*,ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA OQ092464,gag,773,2276,200,1700,forward,0.3910844507174782,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAGCCAGCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATCGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCGCTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTAAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCTCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA OQ092464,pol,2068,5080,1492,4504,forward,0.21863141758600757,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAATACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAGAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGTAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAGACTACCCATACAAAGAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAGACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGACGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAGAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG OQ092464,vif,5024,5603,4448,5027,forward,0.3264662839130924,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTACTCATCCAAGAATAAGTTCAGAAGTTCACATCCCGCTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAGAAGAGATATAGCACACAAGTAGACCCTGGCTTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGCTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG @@ -442,11 +442,11 @@ OQ092464,nef,8791,9412,8209,8842,forward,0.36363636363636354,MGGKWSKSSVVGWPAIRER OQ092467,gag,808,2308,789,2292,forward,0.2880084183556755,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAAAAACAATACAAATTAAAACATCTAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTTCTAGAGACATCAGAAGGGTGTAGACAAATACTGGGACAGCTACAACCAGCTCTTCAGACAGGATCAGAAGAATTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAAATAGAGGAAGAGCAAAACCAAAGTAAGAAAAAAGCAGCAGCTGCAGCAGCTGACACAGGAAACAGAAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCTTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAATAGGTGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAGGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATTCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTGAGAGCCGAGCAAGCAACACAGGAAGTAAAGAATTGGATGACAGAAACTTTGCTGGTCCAAAATGCAAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCAGGCCACAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAACTGTAATGATGCAGAGAGGCAATTTTAGGAATCAAAGAAAGACAGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCATATAGCAAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAAAGAAGGGCACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA OQ092467,pol,2100,5112,2084,5096,forward,0.1880239208210378,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAAATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGATATGAATTTACCAGGAAAATGGAAACCAAAAATGATAGGAGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGCTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCGCATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCCTATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTACACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGGATATTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTGGGATCTGACTTAGAAATAGGACAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAAAGCTGCCAGAAAAAGATAGCTGGACTGTCAATGACATCCAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGAATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACTAAAGCACTAACAGAAGTAGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCAACGAAAGACCTAATAGCAGAACTACAGAAGCAGGGGCAAAGTCAATGGACATATCAAATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGGGGTGCCCACACTAATGATGTGAAACAATTAACAGAGGCAGTGCAAAAAATAGCCATAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAAATTACCTATACAAAAAGAAACATGGGAAACATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGATTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAAAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAGATCAGGCAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCCCCCTAACAGACACAACAAACCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTGACAGACTCACAATATGCACTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGGAAGATACTATTTTTAGATGGAATAACTAAGGCCCAAGATGATCATGAGAGATACCACAGCAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTATAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCACGCATGGACAAGTAGACTGCAGTCCAGGAATATGGCAACTAGATTGTACGCATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTAAAACTAGCAGGAAGATGGCCAGTAAAGACAGTACATACAGATAATGGCAGCAATTTCACCAGTGCTGCGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAAAGTCAAGGAGTCATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAGAAACAAATCACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAGGCAAAGATCATTAGAGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG OQ092467,vif,5056,5635,5040,5619,forward,0.41532297468972923,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATACATGTCTCAAAGAAAGCTAAGGGATGGGTTTATAGACACCACTATGAAAGCACCCATCCAAGAATAAGTTCAGAAGTACATATCCCGCTAGGGGAAGCTAGATTAGTAATAGCAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAAGAAATATATCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGCATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCATAGTAGGACGTTTAGTTAGCCCTCAGTGTGAATATCAAACAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGTAGCATTAATAACGCCAAAAAAGAGAAAGCCACCTTTGCCTAGTGTTAGGAAATTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAG -OQ092467,vpr,5574,5865,5558,5843,forward,0.5793112277557293,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAG -OQ092467,tat_exon1,5845,6064,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTCTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAA -OQ092467,rev_exon1,5984,6065,5969,6047,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG -OQ092467,env,6239,8807,6224,8795,forward,0.4718646278993922,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -OQ092467,vpu,6283,6340,6259,6310,forward,0.4380664652567977,MGHHVEMGHHAPWNVDDL,MGHHVEMGHHAPWNVDDL*,ATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG -OQ092467,tat_exon2,8388,8484,8376,8469,forward,0.4918032786885247,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN**,AGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGA -OQ092467,rev_exon2,8389,8674,8377,8653,forward,0.4123815285339786,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*,GACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAG -OQ092467,nef,8808,9417,8796,9417,forward,0.49080954243253805,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*,ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA +OQ092467,vpr,5574,5865,5558,5849,forward,0.3120665742024965,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAG +OQ092467,tat_exon1,5845,6064,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTCTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAA +OQ092467,rev_exon1,5984,6065,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG +OQ092467,vpu,6076,6340,6060,6309,forward,0.4955621301775147,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*,ATGCAACCCTTAGTAATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAGAAAGATAGATAGCATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG +OQ092467,env,6239,8807,6223,8794,forward,0.4703403690377699,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092467,tat_exon2,8388,8484,8375,8471,forward,0.4918032786885247,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN**,AGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGA +OQ092467,rev_exon2,8389,8674,8376,8652,forward,0.4123815285339786,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*,GACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAG +OQ092467,nef,8808,9417,8795,9416,forward,0.484764542936288,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*,ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA diff --git a/tests/expected-results-large/blast.csv b/tests/expected-results-large/blast.csv index 95436d9..2c4fc32 100644 --- a/tests/expected-results-large/blast.csv +++ b/tests/expected-results-large/blast.csv @@ -1,117 +1,118 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,9386,9635,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,180,1,180,9540,9719,2.04e-69,259,100.000,180,plus,180 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,9497,1,9493,151,9632,0.0,13151,98.473,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG229-T41AG5AG81CA45GA54CG3CA3AGGA18TC32TC11AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA85AG143AG14GA38TC52AG146GA285GA25AG11TC47GA58AG11TG181GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,484,1,484,9236,9719,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,634,1,634,9086,9719,0.0,813,94.795,601,plus,14TCGAGC5GA1AG56GA21GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,9488,9579,2.15e-30,131,98.913,91,plus,18GC73 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,8446,666,9069,1323,9673,0.0,9611,90.161,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC2-T17AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG9TC4TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC46GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC13GA3AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,8140,882,8985,1584,9666,0.0,9469,91.032,7410,plus,6TC32TC59TC77GA5AG17CT17TA5AG29CT8GA32GT23CT6TA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT7GA11CT4CT3AG6AC4AG17GA11TG1TC5ATGAAG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA17AG41CT13AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG57AG7TC32GA11TC56CT69CT45CT39AG95AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA2GA9GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG10GA2TC23TC2AG2AG2AT4CT18CT3GA1CT18AG2TA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG11GA5AG35CT6AC1AG30TA71TC26AG61GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29CA18CG7AGCA22GT99AG92GA13GA14TC23GA32AG17AG2TC34GA31CA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14AT35AG25GA27CA29TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2AT21GT1GC24ACGA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACT6TC6CT4AG23AG23TCCA23GC7TC2-T12AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG33GA20GA10GAGA5GT2CT4GA23AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC2CT1GA2ACCT7TC4TC27TC4TC2TA2GCAC4TG26TA1TA14CT2TG5TC6CA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-4TG5CG20CTAG4CT5AG2-C-T-A4GAGA1CA1CT36AG6GA28CT11CT11CT5CT14TC34AT2-T-G-G7AG14TCGACTAG9AG10TA76CG6CG6AG1CTAT1CG2TG1GACT-G-A-T7TCAC2CT1AG2CGCT1-G-C-G-G-G-A-G-A-A-T-G3GA1AGTG5-G4AG2GA1CA12TC3GA3CG4GATG8AG9AG3CG8CT17GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-C-T-A-T-A-G-5TC2AG7TA5AGCT81GA5GTGA6ACTG16TC5AC6TC51TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC10GA3TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG39GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT10AT4TG2AG1-G-A-C1TCTA5AC10AGGA4GAGA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG69CA36GA46CT46AC5AG14AG8TA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGTAT4TC2ATAC10CG46GA30GA10GT18AT4TC20AGAG20AG37CT22TA7GA2GC28CA1GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG9TC7AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7TG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA16GA25AG1AC28TA13AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT3TC1AG16TA5AG21CT1GA16AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,846,40,881,1539,694,0.0,1076,94.563,800,minus,15CT14GA2GA23CT26CA22AC30AG2TC17AG38CT29GT17TC11AG23CT53CG35GA5AG1TG5GT20TCCT20TC69AGCT13AT8TC7CT17TG1CA75CT2TC29CT6CT31CT6TCTGGA23CT47AT-T-T-T-T12GATG21TC25 -MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9719,582,8404,8985,1,581,0.0,693,91.753,534,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA13AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT3TC1AG16TA5AG21CT1GA4GA11AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 -MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9719,9070,477,9480,577,9627,0.0,10903,92.381,8379,plus,25AG1-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T1AGTA23C-5TG2T-A-GCAT11TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9719,544,8946,9480,1,542,1.17e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9084,652,9689,652,9670,0.0,10957,92.459,8399,plus,15AG51AG25-T-G-A-G-T-A-C-G-C-C-A-A2TA71CTACAGGA17GA25GA6GA5CA38CT39AC17GT34GA29AG15GA25GC3GA51GA1GA5AC6GA4A-C-C-A-G-C-AGCT21AG8TC89AG11CT6CT119TG10AG35GA62TA83CT11AG23GA20TC71AG47TA5AG11GA26GA11TC5AG11AG2GT16CT13GA40AG1GT12TC5CT8TA7TC3AC1AG18AG1GA49CA1AT26AG12CT7GA22AG27GA13TC5ATGA15TC14ACAC7CA4CA12GA9AGAG35GA61CA77AG122TC8AG95CT5AG29AT8GA68CT11AT101CA20CTAG59GA82AG4AT16AG10AC36CT21TC9AG2AG19AG7TC52GT17CT2GA19CT15AC35AG8CT14CT8AG26AC5GA3GA32AG17TC1AG11GA76AG9GA95GA21GA16GA25GA3AG11AG12GA13AG38CT17AG47TC29AG7CT43AG2CA37TA20AG20TC17GA33AC21GA123GA29AT2CA59GA170CT11GA12GA7CT3AC17CA11GACA12AT21AG7AG4AG9CT8AG2GA17CA44CT2TA5GA71TC60GA14TA14CT26CA29GA73AC32TC68GC4CA1CA20AG3AG16AG6GT6AG14AG1AC20AG5TC16AT6CT3CT1GA43CT36GAAG22AG1CA35TC11AC14TG1TC1AT10TC1GT49TC4GA12AG8GA15CT19AG39GAAG12CA6AG3TC11GA27GA27GT23CT8GA18AG14TA9GT18CT2TC2-T33ACAG6CG10AG25AGTA26CT8GA13CA13CA9AT24CA4GC36AG6GA2TG3CA3AGGA9TC41TC4TC2TA2GC5TG26GACTCA21AT8TA31GA24AC3GT15TC20G-G-A-T-C-A-T-G-A-4TA11AG-T-G-G-A-G-A-T-G-G-G-G-G13TC51TC29AG7AC12CT34CT33TC21AG3GT5AT34AG87CG4CA1TG6AG1GT3GA3TA1AG3G-C-A-4GT1A-G-A-1TC5C-A-C-2AG2AGTC2TG1CGTA1ATCG2C-4C-C-A-C-T-2T-2TA1G-T-T-G-G-2GA2AG2GA19CT2CGTCGA12AG6AG4GA5TA3GACT20GA17GAAC2TC2AG5GA3AG1TC19CA79GA4GAATGA4AG1ACTG16AC5AC15GA47CA34AG5ATAC3AT4AG6AG7TC17TCGA9CA4GATA33TA2AC1CG3-C-C-A-G-A-G3GA11GA3TGAT1GA2GACT4GA1T-A-T-7GA1CT2AG4GA6CT4TA1CA3AGCT1AG1AG3CA4GA7ATAT2GA5GA6AGAC19-G-A-A1GT5GA6GA6GATGGC7GA18AGCT2TC1ACTATC39GATC22CTAT5AG1GAGCGTAT1TG6AGCA8GA2GA2GC6CA1AG1-G-A-C-A-C-A5AC10AG28GA34AT4CA6CA2CTGTACGA15TC5CT16GT3GAAG1G-C-T-3G-G-G-2CTAG1CGAT6CT19AG17CA15GA3CT40GA4CA13AG23TACA1CA5CT47GC5AG87AC28AG15GA44CA25CT4AC19AG13CT11TAGC1TG6CA2AC3TC18AC9GA12AG1AT5TC2ATGC9GA1CA8CA28CT1AG8CT12CT15GA4TA4CT11CT6AT47AG2AG26AC7CT30GA3AC26CTCA1GA3CA12CAAG17CT2AGCA6GA1TC4TC3AG3AC9TA3CT7AG13CATG32CT1GA49CT8CT2TC2GA11GT1GA30TC38AG10GT1TG1GA1GACAAG6TG10ACTG36AGGACT5AT4AG8TC2AG9TA5AG1AGGA28AG8AT14ATGA12TC18GA24-A-C-A-G-C-A4AC8AC4AG7GA5CA1A-A-A-4AG11AG2CT10GCGA11CT26CTTG44AC5TC9AG12TC12GA5AC24GA25AGCTTC4TA23TA24GT1GA1GA9ACGC6AG8CAGC1TA14AG6AT18AG4AG7CT2CG25CA5CT5AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 -MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,602,9088,9689,1,585,0.0,679,89.701,540,plus,8AC5TC8ACAG12TC12GA5AC24GA26CTTC4TA23TA26GA1GT7GA1ACGC2TC3AG8CAGC1TA14AG6AT6GA11AG4AG7CT2CG25CA5CT3GA1AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 -MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9719,9061,410,9377,577,9625,0.0,10733,91.855,8323,plus,25-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G3-G-G-A28AGCATC1GT1GA1CATG1-G-A-A-ATG2TA3TC1-G-A-G3AC2CT3-G1TC1TC1-G-G1AC2-GTG2AT2-T-G1GATGGC4CA2-G-C2CG3-CAGCACGTG1AGACAG4-C-T-G-G-TAG4-C-G-C-C3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC13GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9719,542,8845,9377,1,540,2.31e-175,613,90.037,488,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9719,9072,369,9381,577,9624,0.0,10860,92.262,8370,plus,25A-C-TG1ACACTCCT1CT3-T4G-1CT1C-C-C-2A-C-T-28A-G-3T-4TA8TGAG20GA29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 -MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9719,541,8850,9381,1,539,8.58e-176,615,90.203,488,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,9152,512,9583,577,9686,0.0,10851,91.882,8409,plus,24-A-G-A-C-C2-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27-G-G2T-3GATA1AG1TG1GA2A-T-C-C-C-T-C-T-2TA3TC4A-TGCACG3AT1CT1CG1A-A-T-29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,668,8973,9614,1,649,0.0,688,86.976,581,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,79,273,351,577,649,8.05e-10,64.0,78.481,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-CTCGCGTA27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,81,405,485,577,649,5.83e-09,61.1,76.543,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-C-A-CTCGCGCA27 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,31,273,303,9662,9692,8.42e-04,44.0,96.774,30,plus,28TC2 -MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9719,31,405,435,9662,9692,8.42e-04,44.0,96.774,30,plus,28TC2 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,9112,34,9126,646,9679,0.0,10568,90.935,8286,plus,21AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC12AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG38AG7AG20AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA27AT30AG4TC50GA57TC9CT7GA17CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTAG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA7AC11CTCT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3T-1TC2-A2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2-A1GA1CACT1GTGC2GC1AC2AG1C-AG1CAAG2-G-G-GTG14TC1TA2TC11GT7AC8-T-A3-A3CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-T-2AG2T-C-T-AG3CGGACTCA4CT1ACTC4C-T-T-6AGTCAGAGTG1C-TG3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11G-A-A-G-G-T-1GA2G-A-A-7G-G-G-2AGAC4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10-A-A-A3-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT5AG8A-T-G-7TAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12A-A-G-C-A-A-CT5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG5CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC8A-C-C-C-T-A-G-A-T-1GT4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT8AG20CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC27AG3AC1GTTG6CG2GA9C-A-G-8AG19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,598,8529,9126,1,594,0.0,670,89.632,536,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 -MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9719,33,1,33,702,670,1.52e-05,49.7,100.000,33,minus,33 -MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9719,9071,458,9461,577,9625,0.0,10898,92.382,8380,plus,25-G-A3-T-T-T3-T-C-A-G-T-G-T-G-G-A-A-A20C-G-1A-G-G-C-2TAAG17TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9719,542,8929,9461,1,540,8.47e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,9036,130,9032,649,9627,0.0,10320,90.317,8161,plus,18AG72-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-A-A-A47GA23CTACAG6GA31GA6GA29AG2GA75GT19GA7AG8TA13GATC20AG48AG20GAAG28TC1AG2GACT35GC53GA20AT2TC11AG17CA29GA38TC17AG2TC30TG22GT23GA2GA23CT2CT14GA47CT2CT47TC59TC77GA5AG14AG2CT17TA5AG29CT8GA32GT23CT3AGAC1GA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT19CT4CT3AG5GAAC4AG17GA11TG1TC5AT1AG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA8CA4AG3AG55AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG25GA31AG7AC32GA11TC56CT69CT5AG13AG25CT39AG83TA11AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA12GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG13TC23TC2AG2AG2AT4CT18CT3GA1CT18AG1TCTA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG8AT2TA5AG35CT8AG9AG52TC39TC26AG25TC35GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29TA18CG7AGCA10GA11GT99AG92GA13GA14TC23GA32AG13TC3AG2TC34GA30AGCA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14CT35AG25GA57TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2GT21GT1GC25GA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACTAT5TC2CT3CT4AG23AG23TCCA9CT13GC7TC2-T12AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG2GA30GA20GA11GA8CT4GA14GA8AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC1AGCT4ACCT7TC4TC7AG4GA14TC4TC2TA2GCAC4TG26TA1TA14CT2TG5TC6TA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-3GA6CG17GT2CTAG4CT5AG2-C-T-A5GA1CA1CT36AG35CT11CTCA10CT5CT14TC34AT2-T-G-G22TCGACTAG9AG10TA76CG6CG8GT9AGGACT4CA2TCAC2CT1AG2CGCT2TC-G-G-G2TA2-G1GT2-T-G-G-A1-A7AG2GA8TC5TC3GACT2CG4GACGAC7AG9AG3CG8CT9GA7GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-A-T-A-T-A-G-5TC2AG7TA2GT2AGCT51-T-T-G-T-G-C-C-C-C-G-G-C-T1-G-T-T-T-T-G-C-G-A-T-T-C-T-A-A-A-A-T-G-T-A-A-T-A-A-T-A-A-G-A-C-G-T-T-C-A-A-T-G-G-A-A-C-A-G-G-A-C-C-A-T-G-T-A-C-A-A-A-T-G-T-C-A-G-C-A-C-A45TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC14TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG3AC35GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT7TC2AT4TG2AG1-G-A-C1TCTA5AC10AGGA5GA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG29AG39CA36GA46CT46AC5AG14AG8CA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGT5TC2ATAC10CG46GA22CA7GA10GT18AT4TC20AGAG20AG60TA7GA2GC28CA1GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG17AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7CG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA16GA25AG1AC28TA9GA3AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT5AG2TG1AG11TA5AG21CT1GA16AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,543,8492,9032,1,542,4.15e-180,629,90.792,493,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA9GA3AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT5AG2TG1AG11TA5AG21CT1GA4GA11AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 -MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9719,150,1,129,782,633,2.35e-34,145,84.667,127,minus,23-T-T-T-T-T-G-G-C-G-T-A-C-T-C-A-C-C-A-G-T72TC12AG16-C4 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,9385,9634,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,180,1,180,9539,9718,2.04e-69,259,100.000,180,plus,180 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,9496,1,9493,151,9631,0.0,13155,98.484,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG270AG5AG81CA45GA54CG3CA3AGGA18TC44AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA24TCAC59AG143AG14GA38TC52AG146GA311AG11TC47GA58AG11TG181GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,484,1,484,9235,9718,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,634,1,634,9085,9718,0.0,816,94.953,602,plus,14TCGAGC5GA1AG78GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,9487,9578,2.15e-30,131,98.913,91,plus,18GC73 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,8445,666,9069,1323,9672,0.0,9616,90.172,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC19AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG14TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC16TCAC28GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC17AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,8139,882,8985,1584,9665,0.0,9479,91.068,7412,plus,6TC32TC59TC77GA5AG17CT17TA5AG29CT8GA32GT23CT6TA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT7GA11CT4CT3AG6AC4AG17GA11TG1TC5ATGAAG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA17AG41CT13AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG57AG7TC32GA11TC56CT69CT45CT39AG95AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA2GA9GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG10GA2TC23TC2AG2AG2AT4CT18CT3GA1CT18AG2TA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG11GA5AG35CT6AC1AG30TA71TC26AG61GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29CA18CG7AGCA22GT99AG92GA13GA14TC23GA32AG17AG2TC34GA31CA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14AT35AG25GA27CA29TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2AT21GT1GC24ACGA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACT6TC6CT4AG23AG23TCCA23GC7TC14AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG33GA20GA10GAGA5GT2CT4GA23AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC2CT1GA2ACCT7TC4TC32TC2TA2GCAC4TG26TA1TA14CT2TG5TC6CA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-4TG5CG20CTAG4CT5AG2-C-T-A4GAGA1CA1CT36AG6GA28CT11CT11CT5CT14TC34AT2-T-G-G7AG14TCGACTAG9AG10TA76CG6CG6AG1CTAT1CG2TG1GACT-G-A-T7TCAC2CT1AG2CGCT1-G-C-G-G-G-A-G-A-A-T-G3GA1AGTG5-G4AG2GA1CA12TC3GA3CG4GATG8AG9AG3CG8CT17GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-C-T-A-T-A-G-5TC2AG7TA5AGCT81GA5GTGA6ACTG16TC5AC6TC51TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC10GA3TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG39GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT10AT4TG2AG1-G-A-C1TCTA5AC10AGGA4GAGA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG69CA36GA46CT46AC5AG14AG8TA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGTAT4TC2ATAC10CG46GA30GA10GT18AT4TC20AGAG20AG37CT22TA7GA2GC27TC2GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG9TC7AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7TG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA42AG1AC28TA13AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT3TC1AG16TA5AG21CT1GA16AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,846,40,881,1539,694,0.0,1076,94.563,800,minus,15CT14GA2GA23CT26CA22AC30AG2TC17AG38CT29GT17TC11AG23CT53CG35GA5AG1TG5GT20TCCT20TC69AGCT13AT8TC7CT17TG1CA75CT2TC29CT6CT31CT6TCTGGA23CT47AT-T-T-T-T12GATG21TC25 +MN090376,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,8985,9718,582,8404,8985,1,581,0.0,693,91.753,534,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA13AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT3TC1AG16TA5AG21CT1GA4GA11AC1AG13AT15GT7TG19AG11G-10AGAC11AT22GC56AT22GA48AC31 +MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9718,9069,477,9480,577,9626,0.0,10913,92.414,8381,plus,25AG1-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T1AGTA23C-5TG2T-A-GCAT11TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115581.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9495,9718,544,8946,9480,1,542,1.17e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9083,652,9689,652,9669,0.0,10973,92.513,8403,plus,15AG51AG25-T-G-A-G-T-A-C-G-C-C-A-A2TA71CTACAGGA17GA25GA6GA5CA38CT39AC17GT34GA29AG15GA25GC3GA51GA1GA5AC6GA4A-C-C-A-G-C-AGCT21AG8TC89AG11CT6CT119TG10AG35GA62TA83CT11AG23GA20TC71AG47TA5AG11GA26GA11TC5AG11AG2GT16CT13GA40AG1GT12TC5CT8TA7TC3AC1AG18AG1GA49CA1AT26AG12CT7GA22AG27GA13TC5ATGA15TC14ACAC7CA4CA12GA9AGAG35GA61CA77AG122TC8AG95CT5AG29AT8GA68CT11AT101CA20CTAG59GA82AG4AT16AG10AC36CT21TC9AG2AG19AG7TC52GT17CT2GA19CT15AC35AG8CT14CT8AG26AC5GA3GA32AG17TC1AG11GA76AG9GA95GA21GA16GA25GA3AG11AG12GA13AG38CT17AG47TC29AG7CT43AG2CA37TA20AG20TC17GA33AC21GA123GA29AT2CA59GA170CT11GA12GA7CT3AC17CA11GACA12AT21AG7AG4AG9CT8AG2GA17CA44CT2TA5GA71TC60GA14TA14CT26CA29GA73AC32TC68GC4CA1CA20AG3AG16AG6GT6AG14AG1AC20AG5TC16AT6CT3CT1GA43CT36GAAG22AG1CA35TC11AC14TG1TC1AT10TC1GT49TC4GA12AG8GA15CT19AG39GAAG12CA6AG3TC11GA27GA27GT23CT8GA18AG14TA9GT18CT2TC35ACAG6CG10AG25AGTA26CT8GA13CA13CA9AT24CA4GC36AG6GA2TG3CA3AGGA9TC46TC2TA2GC5TG26GACTCA21AT8TA31GA24AC3GT15TC20G-G-A-T-C-A-T-G-A-4TA11AG-T-G-G-A-G-A-T-G-G-G-G-G13TC51TC29AG7AC12CT34CT33TC21AG3GT5AT34AG87CG4CA1TG6AG1GT3GA3TA1AG3G-C-A-4GT1A-G-A-1TC5C-A-C-2AG2AGTC2TG1CGTA1ATCG2C-4C-C-A-C-T-2T-2TA1G-T-T-G-G-2GA2AG2GA19CT2CGTCGA12AG6AG4GA5TA3GACT20GA17GAAC2TC2AG5GA3AG1TC19CA79GA4GAATGA4AG1ACTG16AC5AC15GA47CA34AG5ATAC3AT4AG6AG7TC17TCGA9CA4GATA33TA2AC1CG3-C-C-A-G-A-G3GA11GA3TGAT1GA2GACT4GA1T-A-T-7GA1CT2AG4GA6CT4TA1CA3AGCT1AG1AG3CA4GA7ATAT2GA5GA6AGAC19-G-A-A1GT5GA6GA6GATGGC7GA18AGCT2TC1ACTATC39GATC22CTAT5AG1GAGCGTAT1TG6AGCA8GA2GA2GC6CA1AG1-G-A-C-A-C-A5AC10AG28GA34AT4CA6CA2CTGTACGA15TC5CT16GT3GAAG1G-C-T-3G-G-G-2CTAG1CGAT6CT19AG17CA15GA3CT40GA4CA13AG23TACA1CA5CT47GC5AG87AC28AG15GA44CA25CT4AC19AG13CT11TAGC1TG6CA2AC3TC18AC9GA12AG1AT5TC2ATGC9GA1CA8CA28CT1AG8CT12CT15GA4TA4CT11CT6AT47AG2AG26AC7CT30GA3AC29GA3CA12CAAG17CT2AGCA6GA1TC4TC3AG3AC9TA3CT7AG13CATG32CT1GA49CT8CT2TC2GA11GT1GA30TC38AG10GT1TG1GA1GACAAG6TG10ACTG36AGGACT5AT4AG8TC2AG9TA5AG1AGGA28AG8AT14ATGA12TC18GA24-A-C-A-G-C-A4AC8AC4AG7GA5CA1A-A-A-4AG11AG2CT10GCGA11CT26CTTG44AC5TC9AG12TC12GA5AC50AGCTTC4TA23TA24GT1GA1GA9ACGC6AG8CAGC1TA14AG6AT18AG4AG7CT2CG25CA5CT5AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,602,9088,9689,1,585,0.0,679,89.701,540,plus,8AC5TC8ACAG12TC12GA5AC24GA26CTTC4TA23TA26GA1GT7GA1ACGC2TC3AG8CAGC1TA14AG6AT6GA11AG4AG7CT2CG25CA5CT3GA1AG3AC21ATTC5C-T-A-G-A-A-C-T-G-C-T-G-A-C-A-T-14TC2TG31G-6TC16AT21CTGC21CT22GT34GA84 +MK115690.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,160,1,159,9085,9244,4.40e-48,191,91.875,147,plus,8AC5TC9AG12TC12GA5AC50AGCTTC4TA19-T3TA14GT6 +MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9718,9060,410,9377,577,9624,0.0,10743,91.887,8325,plus,25-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G3-G-G-A28AGCATC1GT1GA1CATG1-G-A-A-ATG2TA3TC1-G-A-G3AC2CT3-G1TC1TC1-G-G1AC2-GTG2AT2-T-G1GATGGC4CA2-G-C2CG3-CAGCACGTG1AGACAG4-C-T-G-G-TAG4-C-G-C-C3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC39AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115571.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9394,9718,542,8845,9377,1,540,2.31e-175,613,90.037,488,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9718,9071,369,9381,577,9623,0.0,10870,92.294,8372,plus,25A-C-TG1ACACTCCT1CT3-T4G-1CT1C-C-C-2A-C-T-28A-G-3T-4TA8TGAG20GA29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 +MK115514.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9382,9718,541,8850,9381,1,539,8.58e-176,615,90.203,488,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT81CT4 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,9151,512,9583,577,9685,0.0,10861,91.913,8411,plus,24-A-G-A-C-C2-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27-G-G2T-3GATA1AG1TG1GA2A-T-C-C-C-T-C-T-2TA3TC4A-TGCACG3AT1CT1CG1A-A-T-29AG23-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG33CT31CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA4AG2CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT8GC1TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT4TG1TA-T-G-A15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T12GA7TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG11AG2AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5C-2TA1A-A-16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,668,8973,9614,1,649,0.0,688,86.976,581,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC25A-T-C-T-C-T-A-G-C-A-G-1G-G-G-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,79,273,351,577,649,8.05e-10,64.0,78.481,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-CTCGCGTA27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,81,405,485,577,649,5.83e-09,61.1,76.543,62,plus,28TC2GTGT2AGCTTC2AT1A-T-C-C-C-T-C-A-CTCGCGCA27 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,31,273,303,9661,9691,8.42e-04,44.0,96.774,30,plus,28TC2 +MK115488.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9623,9718,31,405,435,9661,9691,8.42e-04,44.0,96.774,30,plus,28TC2 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,9111,34,9126,646,9678,0.0,10578,90.967,8288,plus,21AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC12AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG38AG7AG20AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA27AT30AG4TC50GA57TC9CT7GA17CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTAG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA7AC11CTCT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13T-1TC2-A2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2-A1GA1CACT1GTGC2GC1AC2AG1C-AG1CAAG2-G-G-GTG14TC1TA2TC11GT7AC8-T-A3-A3CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-T-2AG2T-C-T-AG3CGGACTCA4CT1ACTC4C-T-T-6AGTCAGAGTG1C-TG3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11G-A-A-G-G-T-1GA2G-A-A-7G-G-G-2AGAC4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10-A-A-A3-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT5AG8A-T-G-7TAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12A-A-G-C-A-A-CT5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG5CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC8A-C-C-C-T-A-G-A-T-1GT4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT8AG20CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC27AG3AC1GTTG6CG2GA9C-A-G-8AG19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,598,8529,9126,1,594,0.0,670,89.632,536,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT99CAAGCTTG1ATATG-G-4C-41 +MK115030.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9126,9718,33,1,33,702,670,1.52e-05,49.7,100.000,33,minus,33 +MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9718,9070,458,9461,577,9624,0.0,10908,92.415,8382,plus,25-G-A3-T-T-T3-T-C-A-G-T-G-T-G-G-A-A-A20C-G-1A-G-G-C-2TAAG17TGAG20GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115498.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9461,9718,542,8929,9461,1,540,8.47e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,9035,130,9032,649,9626,0.0,10330,90.349,8163,plus,18AG72-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-A-A-A47GA23CTACAG6GA31GA6GA29AG2GA75GT19GA7AG8TA13GATC20AG48AG20GAAG28TC1AG2GACT35GC53GA20AT2TC11AG17CA29GA38TC17AG2TC30TG22GT23GA2GA23CT2CT14GA47CT2CT47TC59TC77GA5AG14AG2CT17TA5AG29CT8GA32GT23CT3AGAC1GA2GA1GA10AG14GA12GT34TC29GA60AT14AG12CT19CT4CT3AG5GAAC4AG17GA11TG1TC5AT1AG13TCTC23CA7AG2CT3CT1GATA9AGAG20TC1AC6GA3GA54GA8CA4AG3AG55AG16-C3G-7TC30AG19TC35TC20TC8AG40GA43AGCT11ACGA2AG25GA31AG7AC32GA11TC56CT69CT5AG13AG25CT39AG83TA11AC63GA7AG19AG6GATC40TC51CGATAG8GA23TC8AG8AG2GA23TC20GA11AC9GA4GA2GA12GA43GA2AG2CT36AT40TC38CTTC24CTAG54GA31CT10GA3AG5TA5AG12TA13AG38CT38AG12AG13TC23TC2AG2AG2AT4CT18CT3GA1CT18AG1TCTA44CT19AG53GA12AC4CT32AG6CA16CT32GA30TG10AG2GA11GA14AG8AT2TA5AG35CT8AG9AG52TC39TC26AG25TC35GA5AG14CT5CT28CA12AT9CACG3CT6AG2AGAC1GA1AG4AG18AG2GAGA4AG2AG8CA29TA18CG7AGCA10GA11GT99AG92GA13GA14TC23GA32AG13TC3AG2TC34GA30AGCA1TCGA8CT9TC7AGCT2AGAT9GA13GT22ACGCAT38A-3GTA-G-6CT1AG3GA1GA14CT35AG25GA57TC3AG1TC11AC12CA1AG3AT10TC1GT6TC29TC14GA2GA12AGTC10CA9GA2GT21GT1GC25GA9GA17AG6TC19AG8AG8AG1GAAT11GA2CT9GACTAT5TC2CT3CT4AG23AG23TCCA9CT13GC7TC14AG4AGGA2CT5GA6AG2CATC1ACCGCA2TG2AG2GA30GA20GA11GA8CT4GA14GA8AT8CAGACGGTAT2CT3TA9GC46AG3CA4GA1TC1AGCT4ACCT7TC4TC7AG4GA19TC2TA2GCAC4TG26TA1TA14CT2TG5TC6TA20ATGT8AGGA1GA10AT2CA8AC3GT36G-G-A-C-C-A-4GAAT2T-G-G-4CA2CT12AGA-C-C-A-T-G-C-T-C-A-T-T-3GA6CG17GT2CTAG4CT5AG2-C-T-A5GA1CA1CT36AG35CT11CTCA10CT5CT14TC34AT2-T-G-G22TCGACTAG9AG10TA76CG6CG8GT9AGGACT4CA2TCAC2CT1AG2CGCT2TC-G-G-G2TA2-G1GT2-T-G-G-A1-A7AG2GA8TC5TC3GACT2CG4GACGAC7AG9AG3CG8CT9GA7GA2GA3AC3TAAG1GTGA6AC12T-A-C-C-A-G-A-T-A-T-A-G-5TC2AG7TA2GT2AGCT51-T-T-G-T-G-C-C-C-C-G-G-C-T1-G-T-T-T-T-G-C-G-A-T-T-C-T-A-A-A-A-T-G-T-A-A-T-A-A-T-A-A-G-A-C-G-T-T-C-A-A-T-G-G-A-A-C-A-G-G-A-C-C-A-T-G-T-A-C-A-A-A-T-G-T-C-A-G-C-A-C-A45TC24GA3TG15AGATAC6TA1TGAG3GA4CA16AGTC1AG3GAAC1AT31TC14TA2AC1AG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA4AG3AC35GA1GC9AC8GAAGTC8GA9-G-G3ATGA1GT1GA-A6GA7CG23GA7TC16AG23AT26ATAT2GA2CG3AT-T6ACA-2GAT-A-C-3AGGT7TC2AT4TG2AG1-G-A-C1TCTA5AC10AGGA5GA6GA14GA46TA23AG3CT2CATC21T-G-A-2CAGT2T-A-A-C-A-C-1AT1TC2AG29AG39CA36GA46CT46AC5AG14AG8CA20AG20AG21AC7GA36GA10AG11TA47CT9AGAC13AGGC16ATAC4AGGATATC1CG9AC3TC10CG7AC1AG7GA11GAAGGCGT5TC2ATAC10CG46GA22CA7GA10GT18AT4TC20AGAG20AG60TA7GA2GC27TC2GA35GT2AGCA4CT1CA1TC4TC3AGAG2AC9TA3CT13TG17AG25GA5GAGT39GA17GA11CT23CT11CT36TG11TG1GA3AG2AGTC2TG10ACTG11CG25GACT10AG5AT4TAAG1TGCG6CA3AG2GT1GAGT3GA6GA1ATAG23CG14GA4AG25GA9TACA9AG7CG6AC8AC12GA7A-G-G-6GA3AG2AG8CT7GC27AT7GC49TC5TC8CAAG25GA5AC7GA42AG1AC28TA9GA3AG1GT2AG5GTGA1TGGA5AG6CA1GA8GA3AC2TG17AG2AT12CT5AG2TG1AG11TA5AG21CT1GA16AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,543,8492,9032,1,542,4.15e-180,629,90.792,493,plus,8TC5TC9AG25GA5AC7GA16GA27AC28TA9GA3AG1GT2AG6GA1TGGT5AG1GA4CATCGA8GA3AC2TG17AG2AT6GA5CT5AG2TG1AG11TA5AG21CT1GA4GA11AC1AG13AT15GT7TG2-A-C27G-10AGAC11AT22GC56AT22GA41 +MK115211.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9032,9718,150,1,129,782,633,2.35e-34,145,84.667,127,minus,23-T-T-T-T-T-G-G-C-G-T-A-C-T-C-A-C-C-A-G-T72TC12AG16-C4 MK115158.1,Ref.47_BF.ES.08.P1942.GQ372987,0,9143,8926,8919,162,9029,68,8923,0.0,9530,87.790,7830,plus,27A-C-C-T-2T-A-2TCAC2GA1TG1CGCACA1CGCT1AG1T-C-TA1TC3CGTA38AT1AG21-C-T-G-G-T-G-A-G-T3-C-C-A-A-A-A-A-T-T-T-T43GA20AG2CT1AG6GA20GA9CAAC6GA2AG26AG2GA11ATGC82GA7AG4TC8AG8GATC20GA3AC2GTAG25CT2GA11AG21AGCT6A-G-C-10CA9GA37AGTCGC8AC3GA8GC1CT2AT26GA2AG2AG8GA38CA12GTCG15GA5GC3CT4CT23TC9TC7AC2TC2CT23TC5GA17GA2GT2TCGC16AG5GT11CT5AT5CT17GA6GCGA11AGTC2TC6AG7AG5AT5CT11AC5GA29TC3AGCT7CT9GA6AG5GA14CT5AG3CA6AT4AGCTTC18TA7GT35GA3GT1AG32AG2TA3GCCAAG32GA11AG11GA14GA16TC4AGACCT3GACA1TGCT1GA1GA19TA4AG4AG8GT2TC19AG17GA23GA12AG8GA20TC2TC5GA8AT17CT9CAAG18CT4CTTC2AG1GA3AGAC4AG11AG4ACGA8CGAG1TG5GA2AGAG2A-C-A-5TC2TC4AC9GA1CA2TA2A-C-C-3AG3AG2CT3-C-C-CAT1GATG9AG21TC12GAGAAG7GA2AGCA1AG38GA8AC2GA1GA1CT1AG7GA6GA40AG12GA3-A3G-14CA1TG21AG19TC26GA8TC47AG22GAAG2TC14GA2AG22CT6TC4ACGA23TC36AG7AC20TA11GA26GA11CT2CT5AG17AG2CT2CT5GA27CT1GA8TA21CT2GT2AG4CA8AG101CT5TC8AG1GA24AG11GA2TG2AC63GA22GATC4GA6TC4CT32AC2TC20CA30CGATAG4CA3GA2AG4GA15TC8AG11GA23TC17GA2GA5TC1AG3AC5AG3GA7GA8ACGA14GA4AG32CTCT13GA5AG15AT40TC17TC5AG14CTTC22AGAT10TC16AG3AG24GA25AG2GA2CT20TA4AG3AG9TA13AC14TC32TC2CTTC4GA2AG17AG50TC2AG2AG2AT4CT18CT3GA1CT1GA9AG6AG19AC26TC1AT9GA41AG20GA14AG2CT8GA30CA1AC18GT22AG5GA26CT3TG10AG2GA11GA5AG8GA11TA16GA9AG8TC5CT8AC8AG11AG28TA52TC26AG22AG2TC35GA5AG49CA22CACG3CT8TC1AC1GA25AG3GA4AG2AG38TA11GA5AGCG7AGCA14GA7GT26AG34AG37AG20AC73TC3CG22TA2TC11GA8AG2AC8TC8CA11AG17AG2TA34GA10AG19AG2TAGA14AT16AC4GAGA3GA2TC1GAGAGAGA5GTTC3AC9AT9AG7GA6TC3GA13AW4GAAG1GA3GAGACA2GA1CT7GA14CT3CA7AG23AG21AC1AGAG3GAAG5CG6GA9AG3AG11AG6CA1GA9AG25AGCA25TC9GA1AC17TC14GA2GA2CT10TC10CG1ATCA4AG1GA1AGGC6AG14GCACGA4CTGTGAAGCT1GRARGA2TC9GA9GA44AG8AG10GAAT8TC2GA2CT9GC7TC2CT3CT1GA14TCGA1AC2TC5AG10CAAG5GT6CA7AG2TG8AT2GAGC7TC14AG2TCCA1GT2CT4GAGA9CA2ACCGCA2TG6GA29GA20GA2TC17CT4GATA2CT8AG1AGGA7AT8CAGACGGTAT6TA54GR1AC8GAAGTCAGAGCT4ACCT7TA4TC7AG10TC1CT13CT5AG18TC11TGTCTA3AT13TG33ATGT4CG3AGGA1GA1AG2GT1CT1GAGAAT2CA4TC38TC2AG2GA2CT11GAGT4CACA1CG5GA1TG4AC1CT1AT5AC2TG2GAGT2GTGAG-C-C-A-C-C-3CA2C-T-T-G-G-G-A-3C-4A-C-3TA2TA1-T1AT3GA1CG1CT72CT2AG8CT7TC3CT5CT14TC30GA1AGGTAT3-G-A-A21TCGACTAG8TC23GA8CT41CA5CT8TC5CT4CA1GA1-T-A-C-T2-C-A-C-C-A-C-T-A-A2-C-T-A-G-C1AT5GACT1CG15CT2TC5TC3GACT6ACGCCA2TCAG4A-T-A-A-2TA1CA2AG1-G1CG18GAAC11AG3A-3A-1GA2-C-A2TC2TA2CT2C-T-A-T-A-A-3CT2AC13AG7TA5AGCT12CT9GA37GA26GT6AC1TG16TC4GA7TC29AG18CT2TC13TC10GA4GA2GA4TC2AG3AC5TA4TAAG1CT1GA3TACA3CG12AG2AG2CT3AT2GA2GAAGAC10CT7AGAG27AG8GC1GAAG1CT18CT9GA30GA13GA1GC7AG1AC7TCGAAGTA6AG1GA11AC1GAGTGA1GA14CT23GA11CT1GC6TC3AG29CTAC15TA3AG1TG1GA1AGCA4GAGAATGA1AT1AC2GAT-A-C-2GA1GT6AGTCAT4AT1T-1AC1TC1T-T-10CA6GA5GA6GA5AT47CT1AC4GATC14TC8AGCA2CT2CG18GA2AGTAG-3CA1G-A-1AG1C-A-C-2CG3AG1TC11GA7GA6GAAG39CA17GA18GA19GC17AT1AT6CT46AG3AG1AGAG13AG7AT21AG12TC7AG29GA47AG11TA12CA2CA26CTTA13AGAC14GC3TC12ATAC1CT-A3G-1TC1TG2CT5TG35CT9GAAGGT10AG8AC2AT7AG40TC11TC7CA13AT4GC23TC21AG4TA15AG1TAGA34TC8AG2GA2TC7TA2TA6CTGC21AG8GA34AG3AGCA1TCAG3CAAGTC12AC8GA7GA10TG41TC7GAGTAT30GCCT6GA2TC8TC5GA11CT20TCGA1CT8CT2CTGA7CA4CT21GATA9TCAT8ATAGTC1TGTG7AG2AC12CG18GA11GA13GAGA2TAAG1TGCG6CA3AG1GAGTGA1GT3GA6GA1AT14GA6GA1TC1ACGT3GACT6TA5AG7CTAC11-A6A-8TACA9AG3TC3CG7CT3GC4TC1GTTG18G-A-A-5GT2AG5GA2TC38AT12GT1AC9CTAT39CT3CAAGAGCA10TG11GA5CT3AC7GA2CA39AG1AC2AG6CT10AG17GA3AG1GT2AC8TG13CA9GAGA5ATTG4TC7TCGA3AG3GA5GA5CG2CTTGCA3GC8GATC1AGGA16CA1GA8TCCTCAGATG5GA9AC13CT6AG10GT24GA2AG10AGGA6CT3AGAC31AG2 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,9386,125,9411,380,9719,0.0,10743,90.550,8499,plus,41GC19CT1CT3TC53GA104AC10CT37CT11TGAGGA11AC37AG22CT12-A-A2TA62CA9AC7GA38GA44GA29GA8GA23GA8AG19AG8TA7AG5GATC3TC5CT2AG14TGGA20CT2AG1TC35GA27AC6GA4A-G-C-A-G-T-C-A-A-30CAATTC15TC7TCCA58CA2GA2AG80GA57TG10AG59GA39CA47AC4GA31TC30AG5TC8TC47AG62CT3CT10AG8AG38GA2GA6AG4CT2AG8CT22CT4G-G-T-GAGA1GT2AG3AC14AG19GA4AGCACT1AG32CATC3TC68CT2CTTA28AG12CT22CT2CT4AG41TC5AT10GA24CT18CT2CATA9AGAG29GA84AG60AG4CT40AG44AC31TC8AG20AG80AG56CA20GA2TC17GA17GA8AG14TC5GA59AG20CT8TC9AGGA6AG28CTTA14CA8GA50TC14GA11AG35CT17AG2CT22AG10GA5GA5AG1CG6GC1GA18TC19GA20TC11CT92AG26TCGC15AG21GA3GA1TC2GA14GA3AC26TC68GA28TC8CA44GA10CTAG29GA8AG5TG9GA7GA9GA12TC11GA1TC1AG8GA2AG22TCGA41CT1GA15AG47TC23TC2AG9ATAT22GA1CT8GA9AG2CA2TC41CT19AG65CTAC1GA50GA8CT3AG61AT12AG10GA20GA2AT2TA14TC10AG22AC1AG8GA11GA3AG31GA72AG16CT14GA2CT26GA20CT3AC1CT31TC9AT2TC5TC12AG1CTAG4AG2CT1AG9CT8AG2TAGA1TC8GA38GA124AG4TA17AG35CT56GA13GA14GC44AC2CA8AG100CT20AG5AGAG8AG7GT4CT5CT12AC48AG57CT37AG17GACA21AC4CT2TC5TC11AC12CA1AG3AT10TC1GT6TC5TG38GA6CT12TC4GA2GA34CTGA3GA29GA5TC14AG6TC11GA7AG19GAGT24GAATAT9AG7AG26CT14AG1GA15AT9TC1AG8TC2-T17AGCA8GA6AG1-T3-C-G-A-C-A7AG14CA14GA2AG28GAGA3CG6AC21CT20CT4CT2AC3GA1GC31CA5AC5GA2CG3CA2GAAGGA9TC8TC1CT5CT4AG19TC7TA2GCACGA3TGCT23TC1GACT22AT8CA2TA4GA17GA4AGGA11AG6AG5AC3GTTA32CA2GA2TACAAT1GTAC2AC1-C4CG-G2CA1CGTGTGAG-G12GA2TA10AG24-G-A2CA1-T37AG2TA17CT33AG44GA17CT3AT17AT3TC3GT1AG6AG7GA57CATACA9TC7CT1CG6TG9GTCTTG2CG1T-C-1CTCG1GTC-7ACTC1GA3A-G-A-2AGGT1AGGC1A-A-6AT1T-1CT1TA4G-G-A-G-A-C-9AG23GC1CGTCTA7GA2CA1AG4TGCTTG6CG2CTGA4CT10GA6GA1GAGA3AC7GA1G-A-C-1AG3AC2ACTC2TC4GA5TC19GA1CT8TC20TG5CT2TC38GA13ACAG22AC35AGAG2TA5GA5CT17TC17AG3AG1GA10ATAC9AG22GA8GC3CT5CG40GA2ACAC4GC-C-A-G-A-G-A13TC1AT2TGAT1GA3CT4CA1A-A-T-7GA4AG3AC10CT15GA9CAAC8GA7TC2CGACCA8AG1GA2GA1-T-T2-A-A-A-T4GA3CA11CGTCCA27GA1TC16AG23AT5AC4AG15CTCTA-C-G-14AGT-A-A-16GA8-G-G-A-A-G-T-G-A-C1TC6AC5GA18GA6GT7GA7CA24CAAGAT11TA27CT2GATCTA11AT1TA2AG2CA2GA4ATGCC-A-A-5CT60GA83GAC-T-G-6AT11CT34GC3GA5TC11AG6TA21AG12CT22GA35AG15CA4AG18CA16AG29CT9AG13CTAG15GA4TCATTG3GC1TG8CTAC3TC18AC1AG7GA11GA8TC2AT11AG7GA8GA4TAAG12CT5TGCA3GA5GA8CTCT16TC27AT26AG58CT8GA2AG2GT7CA2GT4GA4AG22AG3CA7GA9AG17ACGA1GT10CATC4TC3CG6TA13AG2AG25AG13AC11GATC4GA8AC49GA5CT12AC14AG1CT11CT8TC26AGAG1CT4GA10AG2AG4GT6TA2ACTG12GA17TG6GACT19AC2AG10AGGT4GT1GAGT10GA12AG5AGGA3AG16GTGA28CA3TC29CGACGT6CG3AC24AG5AG5AG2CT10GC3CT11GA26GA3AC1GT52AGGA29TC25GA3AG2TC42GT6TA4-C4-A-C-C-A2-T1TA3CA1-A1CATA1TA1GATGGATA2CGTG1TCGAGA3CATG-G5TA1CA1-C-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA3AG1AT-G-G2CGTA1-C-C-G-G-A-G-A-G-A-G-A-A-G-T-G-T3C-5CA1CGCTCTGTAG4GCGCAG3-A1AC1ATGTCTGC1-T-C1AC2AG1ACAC1CG4GCAT1-C3TC-G-G-A-G-T-A2CTGC1CA1CA1GC-T-G-C-T3-A3-A7GA-C-A2CG1-A-C-T-T-T-C3ATCGAG1CG1-C-T-T-T-C-C2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,635,8840,9411,1,634,9.31e-121,432,76.535,486,plus,23ACAGGA29TC25GA3AG2TC18GA23GT6TA4-C4-A-C-C-A-GGT2TA3CA1-ATGCATA3-A1TAGATGGA1CGTC1TAGAGCTA2CGTG5TA1-A2-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA5-T-G-G-A-T-G-A-C-C-C-G-G-A-G-A-G-A-G2TGCTTGCT3C-5CA1CGCTCTGTAG4-C-C-G-C-C-T-A1GC1-T-T-T1CA1GC1-C1AT1-G-C-C3AG2-C1AGGC1AT2AG3GT1GCAT2TACATGCAGAACCT2AT1GAACCA3-A7-A-C-A-A-G-G2-C-T-T-T-C-C2-T1CG1CG2-TATGT1AC2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,255,125,379,9465,9719,5.83e-95,346,97.255,248,plus,41GC19CT1CT3TC53GA104AC10CT17 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,211,8973,9182,544,749,1.01e-65,249,92.417,195,plus,62AC10CT49TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,151,1,150,604,749,4.57e-39,161,88.742,134,plus,2AC10CT37CT11TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 -MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9719,91,8973,9063,9629,9719,9.52e-29,126,97.802,89,plus,62AC10CT17 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,9377,104,9441,402,9683,0.0,9753,86.765,8136,plus,19GC21CT24GA78TC55GA1TC1A-A-AT1CT1GA2C-2AGCTCGAT1A-2GA1CACT1ATGC37TGAGGA8AG2AC49AGAG22-A-A-A1TA11AG15AG4AG20GA3AG1AG12AC3AG3GA7AG10AG2AG15GA17AG8AG3AG43GA8AG3GA3TC1AG1AG25AG37CA10AG3AG7AG6TGGA13AG5GT8AGGA4AG26GA11GA12AG2AC4ACGAGACT3AGCT3TC7TA16CA1AC2AG8AG37AGAG17AG2AG17AG53TC14AGAG1TGAG4CT8TC15AG2GATC9AG13AGAG6TG1AG15AG22AG10AGAGAG14AG29AG3AG7CA20AG2AG1GA13AGAG5TC2AG3CT15AG22TC1AG7AGGA3AG1GA5AG25AG13TC8AG8AT5AG1AG10AG7AG10AG5GA5AG2TC11AG17AG8AG32AGAGAG4AG2AG13AG4AG6AG19CT4GAGA1GT4CT1AC26AG13CACT6AG21AGAG5TC5AG8AG8AG6AG7AG5AG1AG4AG3AG14AG4CT3AG20AGAG3AG12CT4AG10AG3C-T-2C-C-T-C-A-A-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-6AG9AG2TC1-G-G-G1AT3AGGA11TC14AC1AG11GA9CT13AG20AC17AG1AG1AG10AG5TC5AG31CA2AGGAAG7AG3AG2AG16AG1AGAG5AG2AG19AG5AT3GA3CT9TCAT1CTAG4CT9AG7GA30AG20CA2AG8CT13CT2TC8AG24AG7CT19AG6AG41AG2AG5AG3AGAG16AG28GA20TCGA1CT7AG2AG32AG9TC4AGAG3AG8AG1TA11TC3AGAG1CT19CA8AG5AG30AG9AG3AG42AGAG15TC14AGAG3AG4AG34GA3CT16GAACCA30AG15AG17AG4AG12GA2AG4AG5GA8AGAT6AGAGAG2TC19GA2CT11CT10AG4AG1GT41AG14AC2TC1AG27AGAG1AG10AG15TCGC2AGAG9GA1AG12GA7AG1AG11TC11GA44AG13TA9AG3CTAG12GT4GA15CA10AGAG1AGGC4TC2GA21AG16AG7AGGA13CT2AGAG8TC14GA11AG15TA10TC10AGAGAG3GA14GA1TC1AG11AG7AGAG7AG9TG16AG3CT3AG3AGAG8CT2CT22AG12AG12AG2AG23AGAG9TC1AGAG2TG1AC5CT1AG8AG11GA1CT3AG20AC3AC18AG5AG8CA3CT7CT5AG5AG2GACT28GA9AGAGGA21AC21GA12AG15AG4AG5CT7AGAG2GA5CA6AG5AGAG1AG10GA3AG5CT11AG6AG19AGAG6AT2AG8AT2CA3AG1AG16AGAG3AG11AG10AG6AG47AGAG6TC6AG1GA20TA8GA22AG4AG7AG21AG19GT11GA3AG4AG11CT3AC8CT5AG28AT9CA11AG2AGAC3AG2GT1AG11AG2AG3AGAGAG9AG6AG1TA25AG7AG7AG5TA18AG4AG4AG10AG66AGAG2AG10AG30AC5GA43AG11AG10GA9AG18TC15AGAG21CT35AG7AG7AGAG13AG31AG28TC11AG5AGAG6CT1AG1AGAG2AG1GTCT9CT2TC2CT4CG1AC28TC11AG1GA9AG16AGAG19AG12AG2CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT39AG3AG23AG19GA26AT1AC12AG7AG21AG9AGAG6TC9AG18AG10GAAT17CT5AGCACTAT5AC2ATAGAG1CT2AG1AG3TC17AGAGAG9AG2AG4AG27AC10TC2-T10AGAG5AGCA15AG2GATC2TGGA2AG2AG12AG13AC14AG23GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT11AG2AG9TC7TA2ACACGA3TG26GACT20AG1AT8GAGT4AG6AG27TC2AGAT5AG5AC3GT1AG28CT3-G-G-A-G3GT5GC1ACG-A-A-4CGAGGACG1C-1TG1TGAG2AG2AG2AGAG5GC9AGAG22GA1GA5TA4AGAG16AG11AGAG1GAAG2TA4ACTC11CT32AG13AG30TC8TA7AT4AGAT21TC4AG7AG10CA22AG6AG22CT6GA16CG6TG11AG2AG3AG5GAT-A-G-G-1AT1TC3ATCAAGAT1TG2TG1AGTGCGTACG5A-A-C-4AGCG1AGT-A-C-4AG1AG3AT1T-G-1CA20CG4GAAGGC7AG3AG4GAAG12CT17GA1CA2GA11AT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG3AG7AG8GA5ATGA2GA3TC7AG5AG9ACGA27AG7AG8GA21AG1TC2CT9AG2AG2AG5CA9ATAC8AG6AG6ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C2AGAG7AT2TGAT1GA3CT1AG2CA1G-A-T-5AG1GA4AG20CT3-A3ACCA1GA2TG3G-1GA9GACAAC1AG4TC1GAAGAC7AGGA3AC5AG4AT26AC3AG3AG4ACTC8AT19AG3AG18CTAT6GA18A-A-2G-7AT3AT1CG1-G2-C-T-G2CGAG1-T-C2CA5AC1AG2-G-G2TG-T-G-A-C-A-C-A5AC5GA20CA4GT7GA5AG22TC6AGAGGAACTA6GA2CT17AG2AGAC14AG2AG3CAAT1CGTC2TC1GA1AG1AGGTACAC4CT10AG3AG1AG2AG6AG8AG21CT17GA6AGAG19CA1AG4AG3AG21AG1AGAG3C-G-T-8AT7CTAG7AGAG2AG16AG8GC3CA10AG5AG29AG12CT6AG22AC18AGAG8AG15GA5TG4AG12CA1AG15AGAG6AGAG8AG20AG9AG4AG6AG3CT9T-A-1AT1TG1CA2TGCA1ATAT1-G-A2AC3TC5AG4CG3AG13CA1AC10AGGCAT5TC2ATAC4CA2AG12TA3AG2GAAG11AC10AG3CT5CA4AG4AG5AG5AG5GATC8AT5AG1AG10AT25AG3AG6AG4AG11TC25AG5CT11AG2GT7TA12AG2AGAG4AC12AG18AG1AG12GA8GTATAC9CATCAG3TC3AGCG4CT4AGAG5CT4AGAG11TC13AG3AG1AG18GACATC2AG2CT4CG2AC4AG4AG2AG1AGAG2AGAG2GAAGTC6GA2CT1AG2AG2GA6GA7AGAG1TG37AG3TC3TC2CA11AGAG1AG7AGAG12AGGT4AGAG1AGTC1AT1CT6TA3TG14AGGA8AG5AG4AG1GACT5AT4AG2AGAG9AG10TA2AG2GACT1AG3AG4GA6AGAG8A-G-A-A-A-3T-T-A-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-A-G-A-A-A-G-A-2AG17CA2AG3AGAG17TC1AG6TC2AG23TG2AG4TC16AG18AG2AG2AG2AG2CT10GC6AG26AG6TG2AG47TC1GC5GA11AT9TC5GA1TC14AC13GA3AG14AG12AT24TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG11AG7AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,598,8845,9441,1,598,0.0,659,88.629,530,plus,14TC1GC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA5AT24TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG11AG1GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,201,104,304,9487,9687,2.55e-74,278,98.010,197,plus,19GC21CT24GA78TC55 -MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9719,111,1,111,627,736,2.52e-31,135,92.793,103,plus,40TGAGGA8AG2AC45C-1AC3TG4 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,9078,150,9207,636,9627,0.0,9749,87.905,7980,plus,31AG41-A23CG21GA3TA38TG20CG3AG8AC3AG10TCAGCGCT9AGAG16GA17AG30CT2CT14GATA13CT2GA5TA2AG15GT50GATC9CT2AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC11AG8AGCG1ACTA24AG10AG28AG18CT8AG41AG1AG20GA11AG11TG2GA10AG7TG19CG22AG9AG20CT24AG3AG7CA28CT20AGAG1GACT4CT24GATC7TC14AG7AG10AG3TC11AG16AGGA2TC8GT8TG10AG18AG14TC14CT14AG8AG6TC32AG13CT41GT5CTTA7AGGA4AGGA12AG14AT28AG1AG10AG17AG6AG7AGAG6AG8AG23AG6C-1G-A-C-T-A-A-G-A-C-13AG7TC9CT15AG9CT26GA4CA14TC2AG2AT4GA5GA4TC15AC3AT4CA1AG15GA10AG20AC1ACAG1ACTA7AG5AG11AG47AG1AG11AG2AG16AGAGAGAG5AG2AG29GA3CT9TC30AG10GA2AT12AG16CT3CA2AG22CT2TC8AG21TC7AG3AG6GA36GA6AG11GA4AG2AG9AGAG7AT8AG7GA8TC44AG1AG16CA19AT10AGAG9CT2AG49AG5AG23TC5CTAG10AG23CT15GA6AGAGGA3AG25AG3AG4AG55GAGC31AG15AG18AG6CT14AG2AG17AG5AG5CT14GA12AG10TC4AG3AGAG24AG16CGAT9CA10AG27AGAG1AG2GA7AG6CT5CT2TC4AG11AG46GA72CTAG33GA11AG2ACGA2AG5AG44AGGA13CT3AG26GA24GA2CATC4GACG12AGAG22AG2TC8AG7AG1AG3TCGA9AG18AG11AGAG2AG5CT17AG3CT3AG28AG10TC9AG2AGAG9TC2AGAG11AG9AGGA8GTGA1CT3AG10GA6TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG6AG1TC2CT7AGAG2CA12AG6AG31AGAC1AG7AG1GA10CT5AG10AG8AT8AG16AG16AG52GA6TC11CG1TC6AG53AG5AG7AG21AG4CT18GC28CT3AC1CT19AG11TC9AT21AG1CTAG4AG4AGAG10AG2AG3AG1AGGA15AG1TA14TC9AG8AG13TAAG27AG48TC2TC51AG35CT14TA18AG22GA1AT71TC33CA4AG6AG58AG3CA21CT2AG5AGAG7CAAG1AG3AG1GT4CT19AC1AC6AG2CT22TC3AG3AT2AT13AC8AGAG32AG2CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC5AG8TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG7AG5AGGA2AG16CTCT12TC4CT2TC2-T10AG6AG9GA5ACAG3TC22AG17CATC9AG3AG14AG4TAGA10AC16CAGA24CT4CT7AGGC29AG19TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT8CT2GC13GACT24TC6TA1AC10AG6TA11GA18AG5AC3GT33CA-G3GA1CACT1ATGC2GC1AC2AG1C-C-1CG1CGTA1-G-G-G-G9AG4TC1TA2TC5AGAG3AGGT1AG5AC8CT1-C-A-G1CA2CA4AG16AGAGAG8AG1AG3AG8TC38GT6AGATGA10AG3AC2CA25GA6GA7CT3AG1AT14CAAT10AG18GA28AG24GA3CT18CG6TG9A-A-2TG2AGTACA1AG1C-T-1GAC-C-4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5AGT-G-A-A-A-2AG8AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT9AG2GA2GA11GA1AT4G-T-A-A-A-A-A-T-A-4GCGA2A-A-A-6AT3TC2AG24AG21AG18TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT4CT18AG2AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT2GC2CT2AGCA1TA4AG2GA4AG8GA4AG11-G2AC2GA2TGA-4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA6CATG13AGAG8GA2AT2GA1TC3TC12AG3AG19AT7GA16AG1ATAT11AG1A-A-T-8TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGATAG1GA35GACT2GATC10AG1GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA3AG5AG9AG8AG7AG22CA6AG8AG2AG11CA1TG20AG1AGGA12AG1AGAG2CA1TA1AG6CG6AG7AGAG19AG8GC3GA10AG41AG14AG40AGAG22AG1GA8TG1AG14AG14AGAG6AGAGAG29AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AGAG2AC1AG7GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA1AG11AGAG4AG4GA4TA3CA1GT1AG3AG1AG10AT10AG6AG8AG2AG17AG2AG4GT13AG9AG5CT8GA2AG2GT7TA11AC3AG18AG3CT7AGGA4AG2AG3AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC13AG12AG4CTGAGA4AG5AG8AG8AGAGAG2AGAG5AC2GC2GA4AG2AG9GA7AG10AC13AT14CTAG7AC15AG9AGAGAG11TG5AG3GCCT1TG11TG11CG1CA16AG4AG1GACT13AG3AGAG5TG5GA3GTCATGCTAGAT1GACT1AG8GA1CTAG3AG3GA1AG3AG9A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-9AG3CA2AG3AGAG20AG3GA10CA1TC31AC1GTTG6CG12CG2AG2A-A-A-2AG5AGAG12GC18GA15AGGC4CG5AC22AG11TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC3AG3AG5TA18TG8AGGA12GA1GATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG1AG5GT3GCACAGCG1CG8AG2GACG35AG1AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,543,8665,9207,1,542,1.27e-164,578,87.293,474,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC3AG3AG5TA18TG5TG2AGGT7GA4GATCGATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG7GT3GCACAGCG1CG8AG2GACG37AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 -MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9719,151,1,150,781,631,2.96e-50,198,96.026,145,minus,22AT3CT21GC23-T41TC12AG23 -MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9719,9036,155,9136,649,9627,0.0,10637,91.479,8266,plus,18TGAGGA85-A-A-A49TA24ACAG27AG10GA57CT2CT5TG9AT4GA2AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC13ACGATC1CG2GACT20GT12CA31GA23GA20CT2TC8GA2AG23GA95GA42GA13AG50AG10CG11GA27CT32GA30TC9AG49GATCCT17AT2GA5TG26AG14AG41AG2AT35GA2GA14AG42AGAC2TC41CT35TC50GA68CA18CT38GA13TC5ATGA6GA7TC18GA1GA9GC11GA9AGAG40AG41CT97CTTC68CA6TC19TC20TC8AG12CA88AG8AG8GA95GA11AG41CT20GA6AG35AG11AG43TC85TC24GA38CT53AG11CTTC6AG7TC1GT11TC20CT8GT59CA5TC27CT7AG26TCGC13GA2AG19AGGA3GA7GA11GA4AC39GA2AG59GATA22GA50GA10CT7AG64GA14CT4GA9AG8GA2AG11TA2CA11AG23CT14CT32AG5AG8TC2TA14TC23TC37GACT14GA6TA31AGCT1GA10GA6AT11AG39CT7AC18ACGAGA12AT39GA6CT2TG77CA8GA23GT2GA16AG66TC11CT8GA10CT37TC88GA8AG11CT2CT2CT17GA8GA3GA10AT8AC1CG10AG12AG18AG2GA13GT3CA71AG35CA93CA19GA46AG4GA25AG2TC2TC141CA32CTAG5AGAG6CTCAAG29AGTC35GA74AG17CG3GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG59AC22CT5AG10GAAT25CTAT5TC8GA2AG33AG14TA31TC2-T15CT1AG16AG1CT43TC34GA3CG10AT14AG2CT34GC46CG3CA3AGGA18TCATCT5CT9GA7TC6TC4TC1CTTA2TCACTA3TG2AG23GACT4TA17GT8CA12AG11AG6GA1GA6TC15AC7TA2GA32TACAAT1GT-C2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC12AG13AG4AG2GA4CACA1GA1GT35GAAG7AC37AGGA8CT55AG5AT1AG1GT6AG6GA16GA3AG10TA38TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CG-C-G-G-G-A-G-A-A-T-G-A2CA1TG1GA-G-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG2AC1AG6GTCAGT3CT11AC5TA2GA2GCAC7GA1AT2G-A-A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT34TA21AG8GA13AC5GA5ACGA26GA19AG55AG1GA10AT4AT4AG6AG6AC13TC4GCGAAC1GT1CTAG2CG5TATACT4TC27TA2ACACAG3-C-C-A-G-A-G19TGATCT4CT4GA1T-A-T-7GA1CT2AG2GA21GA1-A-G-C3TA28CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT16GA8AG26CT5TC9TA2TCCA15CT3ATCT3AT1A-T-G-5GT1TG3TAGC-T1CA1-G-G3TA3GA1TC3CG1-A-G3-G2GATC1ACTA5AC4AC25CA8GAGA44AGCA3AT20GC1TA14GT2GT2GTGATGGC1TATC5AGAT1TC4CT3TC15AG6AG3TC37GA16AG19AG14AG5GA11AG3CA1GA6AT25CA20GC5AGGA9AT11GA1GT19AG42TC25TC18GA23CA16AG2AGCA35AG14CGGC7GA1T-G-G-G-C-A-3CT3ATAC3AG2TAGC1CG6GAGA1AC3TC18AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG28CA34GA5TA2CA1AT18AT69AG15CT11AG10TA7GA1TC9GC27GA17AG2GA7GAGT17TC3AG20AG35CA17GA1TCCG62GA5CT29CT11CTAG7TC4TC9AG12AG1AT6AG2TG5AG2AGTC1GT8TA3TG12GA17AG6GACT38AGGT1GA8ACAC1GA1AT2GA14A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-G-G-G-A-22GA17AC14TC8CA1TC8GC14TC7AC31G-A-T-19GC21CA8TC2AG6CG7GT39GA2TC9AG3GA41TC10GA25AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT23AG7CT3TA21CA12AG11ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G21CT22GC18-T56TG45 -MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9719,542,8609,9136,1,542,1.63e-174,610,89.852,487,plus,11GA2TC8ACAG3GA41TC10GA36CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT6GA16AG7CT3TA21CA24ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG21CT22GC18-T56TG45 -MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9719,9144,312,9387,577,9686,0.0,10905,92.104,8422,plus,25-G-A-C3-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23C-TA1TA2TG1AC2A-2GA1T-C-C-C-TG1TG3TGCGTGCATA1GC3TA2CA2C-C-G-AT4GC1T-A-2TGACGAAG5AG18AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25 -MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9719,654,8787,9414,1,645,0.0,705,88.532,579,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,9385,125,9411,380,9718,0.0,10753,90.581,8501,plus,41GC19CT1CT3TC53GA104AC10CT37CT11TGAGGA11AC37AG22CT12-A-A2TA62CA9AC7GA38GA44GA29GA8GA23GA8AG19AG8TA7AG5GATC3TC5CT2AG14TGGA20CT2AG1TC35GA27AC6GA4A-G-C-A-G-T-C-A-A-30CAATTC15TC7TCCA58CA2GA2AG80GA57TG10AG59GA39CA47AC4GA31TC30AG5TC8TC47AG62CT3CT10AG8AG38GA2GA6AG4CT2AG8CT22CT4G-G-T-GAGA1GT2AG3AC14AG19GA4AGCACT1AG32CATC3TC68CT2CTTA28AG12CT22CT2CT4AG41TC5AT10GA24CT18CT2CATA9AGAG29GA84AG60AG4CT40AG44AC31TC8AG20AG80AG56CA20GA2TC17GA17GA8AG14TC5GA59AG20CT8TC9AGGA6AG28CTTA14CA8GA50TC14GA11AG35CT17AG2CT22AG10GA5GA5AG1CG6GC1GA18TC19GA20TC11CT92AG26TCGC15AG21GA3GA1TC2GA14GA3AC26TC68GA28TC8CA44GA10CTAG29GA8AG5TG9GA7GA9GA12TC11GA1TC1AG8GA2AG22TCGA41CT1GA15AG47TC23TC2AG9ATAT22GA1CT8GA9AG2CA2TC41CT19AG65CTAC1GA50GA8CT3AG61AT12AG10GA20GA2AT2TA14TC10AG22AC1AG8GA11GA3AG31GA72AG16CT14GA2CT26GA20CT3AC1CT31TC9AT2TC5TC12AG1CTAG4AG2CT1AG9CT8AG2TAGA1TC8GA38GA124AG4TA17AG35CT56GA13GA14GC44AC2CA8AG100CT20AG5AGAG8AG7GT4CT5CT12AC48AG57CT37AG17GACA21AC4CT2TC5TC11AC12CA1AG3AT10TC1GT6TC5TG38GA6CT12TC4GA2GA34CTGA3GA29GA5TC14AG6TC11GA7AG19GAGT24GAATAT9AG7AG26CT14AG1GA15AT9TC1AG8TC19AGCA8GA6AG1-T3-C-G-A-C-A7AG14CA14GA2AG28GAGA3CG6AC21CT20CT4CT2AC3GA1GC31CA5AC5GA2CG3CA2GAAGGA9TC8TC1CT5CT4AG27TA2GCACGA3TGCT23TC1GACT22AT8CA2TA4GA17GA4AGGA11AG6AG5AC3GTTA32CA2GA2TACAAT1GTAC2AC1-C4CG-G2CA1CGTGTGAG-G12GA2TA10AG24-G-A2CA1-T37AG2TA17CT33AG44GA17CT3AT17AT3TC3GT1AG6AG7GA57CATACA9TC7CT1CG6TG9GTCTTG2CG1T-C-1CTCG1GTC-7ACTC1GA3A-G-A-2AGGT1AGGC1A-A-6AT1T-1CT1TA4G-G-A-G-A-C-9AG23GC1CGTCTA7GA2CA1AG4TGCTTG6CG2CTGA4CT10GA6GA1GAGA3AC7GA1G-A-C-1AG3AC2ACTC2TC4GA5TC19GA1CT8TC20TG5CT2TC38GA13ACAG22AC35AGAG2TA5GA5CT17TC17AG3AG1GA10ATAC9AG22GA8GC3CT5CG40GA2ACAC4GC-C-A-G-A-G-A13TC1AT2TGAT1GA3CT4CA1A-A-T-7GA4AG3AC10CT15GA9CAAC8GA7TC2CGACCA8AG1GA2GA1-T-T2-A-A-A-T4GA3CA11CGTCCA27GA1TC16AG23AT5AC4AG15CTCTA-C-G-14AGT-A-A-16GA8-G-G-A-A-G-T-G-A-C1TC6AC5GA18GA6GT7GA7CA24CAAGAT11TA27CT2GATCTA11AT1TA2AG2CA2GA4ATGCC-A-A-5CT60GA83GAC-T-G-6AT11CT34GC3GA5TC11AG6TA21AG12CT22GA35AG15CA4AG18CA16AG29CT9AG13CTAG15GA4TCATTG3GC1TG8CTAC3TC18AC1AG7GA11GA8TC2AT11AG7GA8GA4TAAG12CT5TGCA3GA5GA8CTCT16TC27AT26AG58CT8GA2AG2GT7CA2GT4GA4AG22AG2TC8GA9AG17ACGA1GT10CATC4TC3CG6TA13AG2AG25AG13AC11GATC4GA8AC49GA5CT12AC14AG1CT11CT8TC26AGAG1CT4GA10AG2AG4GT6TA2ACTG12GA17TG6GACT19AC2AG10AGGT4GT1GAGT10GA12AG5AGGA3AG16GTGA28CA3TC29CGACGT6CG3AC24AG5AG5AG2CT10GC3CT11GA26GA3AC1GT52AGGA29TC29AG2TC42GT6TA4-C4-A-C-C-A2-T1TA3CA1-A1CATA1TA1GATGGATA2CGTG1TCGAGA3CATG-G5TA1CA1-C-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA3AG1AT-G-G2CGTA1-C-C-G-G-A-G-A-G-A-G-A-A-G-T-G-T3C-5CA1CGCTCTGTAG4GCGCAG3-A1AC1ATGTCTGC1-T-C1AC2AG1ACAC1CG4GCAT1-C3TC-G-G-A-G-T-A2CTGC1CA1CA1GC-T-G-C-T3-A3-A7GA-C-A2CG1-A-C-T-T-T-C3ATCGAG1CG1-C-T-T-T-C-C2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,635,8840,9411,1,634,9.31e-121,432,76.535,486,plus,23ACAGGA29TC25GA3AG2TC18GA23GT6TA4-C4-A-C-C-A-GGT2TA3CA1-ATGCATA3-A1TAGATGGA1CGTC1TAGAGCTA2CGTG5TA1-A2-A-G-C-T-T-G1CT1GC3AC1TG1TG2TC1AT2GA5-T-G-G-A-T-G-A-C-C-C-G-G-A-G-A-G-A-G2TGCTTGCT3C-5CA1CGCTCTGTAG4-C-C-G-C-C-T-A1GC1-T-T-T1CA1GC1-C1AT1-G-C-C3AG2-C1AGGC1AT2AG3GT1GCAT2TACATGCAGAACCT2AT1GAACCA3-A7-A-C-A-A-G-G2-C-T-T-T-C-C2-T1CG1CG2-TATGT1AC2AG1GACG41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,255,125,379,9464,9718,5.83e-95,346,97.255,248,plus,41GC19CT1CT3TC53GA104AC10CT17 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,211,8973,9182,544,749,1.01e-65,249,92.417,195,plus,62AC10CT49TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,151,1,150,604,749,4.57e-39,161,88.742,134,plus,2AC10CT37CT11TGAGGA11AC27-A9AG10CA1TG3C-T-G-4G-G-5GT4 +MK114705.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9411,9718,91,8973,9063,9628,9718,9.52e-29,126,97.802,89,plus,62AC10CT17 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,9376,104,9441,402,9682,0.0,9757,86.775,8136,plus,19GC21CT24GA78TC55GA1TC1A-A-AT1CT1GA2C-2AGCTCGAT1A-2GA1CACT1ATGC37TGAGGA8AG2AC49AGAG22-A-A-A1TA11AG15AG4AG20GA3AG1AG12AC3AG3GA7AG10AG2AG15GA17AG8AG3AG43GA8AG3GA3TC1AG1AG25AG37CA10AG3AG7AG6TGGA13AG5GT8AGGA4AG26GA11GA12AG2AC4ACGAGACT3AGCT3TC7TA16CA1AC2AG8AG37AGAG17AG2AG17AG53TC14AGAG1TGAG4CT8TC15AG2GATC9AG13AGAG6TG1AG15AG22AG10AGAGAG14AG29AG3AG7CA20AG2AG1GA13AGAG5TC2AG3CT15AG22TC1AG7AGGA3AG1GA5AG25AG13TC8AG8AT5AG1AG10AG7AG10AG5GA5AG2TC11AG17AG8AG32AGAGAG4AG2AG13AG4AG6AG19CT4GAGA1GT4CT1AC26AG13CACT6AG21AGAG5TC5AG8AG8AG6AG7AG5AG1AG4AG3AG14AG4CT3AG20AGAG3AG12CT4AG10AG3C-T-2C-C-T-C-A-A-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-6AG9AG2TC1-G-G-G1AT3AGGA11TC14AC1AG11GA9CT13AG20AC17AG1AG1AG10AG5TC5AG31CA2AGGAAG7AG3AG2AG16AG1AGAG5AG2AG19AG5AT3GA3CT9TCAT1CTAG4CT9AG7GA30AG20CA2AG8CT13CT2TC8AG24AG7CT19AG6AG41AG2AG5AG3AGAG16AG28GA20TCGA1CT7AG2AG32AG9TC4AGAG3AG8AG1TA11TC3AGAG1CT19CA8AG5AG30AG9AG3AG42AGAG15TC14AGAG3AG4AG34GA3CT16GAACCA30AG15AG17AG4AG12GA2AG4AG5GA8AGAT6AGAGAG2TC19GA2CT11CT10AG4AG1GT41AG14AC2TC1AG27AGAG1AG10AG15TCGC2AGAG9GA1AG12GA7AG1AG11TC11GA44AG13TA9AG3CTAG12GT4GA15CA10AGAG1AGGC4TC2GA21AG16AG7AGGA13CT2AGAG8TC14GA11AG15TA10TC10AGAGAG3GA14GA1TC1AG11AG7AGAG7AG9TG16AG3CT3AG3AGAG8CT2CT22AG12AG12AG2AG23AGAG9TC1AGAG2TG1AC5CT1AG8AG11GA1CT3AG20AC3AC18AG5AG8CA3CT7CT5AG5AG2GACT28GA9AGAGGA21AC21GA12AG15AG4AG5CT7AGAG2GA5CA6AG5AGAG1AG10GA3AG5CT11AG6AG19AGAG6AT2AG8AT2CA3AG1AG16AGAG3AG11AG10AG6AG47AGAG6TC6AG1GA20TA8GA22AG4AG7AG21AG19GT11GA3AG4AG11CT3AC8CT5AG28AT9CA11AG2AGAC3AG2GT1AG11AG2AG3AGAGAG9AG6AG1TA25AG7AG7AG5TA18AG4AG4AG10AG66AGAG2AG10AG30AC5GA43AG11AG10GA9AG18TC15AGAG21CT35AG7AG7AGAG13AG31AG28TC11AG5AGAG6CT1AG1AGAG2AG1GTCT9CT2TC2CT4CG1AC28TC11AG1GA9AG16AGAG19AG12AG2CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT39AG3AG23AG19GA26AT1AC12AG7AG21AG9AGAG6TC9AG18AG10GAAT17CT5AGCACTAT5AC2ATAGAG1CT2AG1AG3TC17AGAGAG9AG2AG4AG27AC10TC12AGAG5AGCA15AG2GATC2TGGA2AG2AG12AG13AC14AG23GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT11AG2AG17TA2ACACGA3TG26GACT20AG1AT8GAGT4AG6AG27TC2AGAT5AG5AC3GT1AG28CT3-G-G-A-G3GT5GC1ACG-A-A-4CGAGGACG1C-1TG1TGAG2AG2AG2AGAG5GC9AGAG22GA1GA5TA4AGAG16AG11AGAG1GAAG2TA4ACTC11CT32AG13AG30TC8TA7AT4AGAT21TC4AG7AG10CA22AG6AG22CT6GA16CG6TG11AG2AG3AG5GAT-A-G-G-1AT1TC3ATCAAGAT1TG2TG1AGTGCGTACG5A-A-C-4AGCG1AGT-A-C-4AG1AG3AT1T-G-1CA20CG4GAAGGC7AG3AG4GAAG12CT17GA1CA2GA11AT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG3AG7AG8GA5ATGA2GA3TC7AG5AG9ACGA27AG7AG8GA21AG1TC2CT9AG2AG2AG5CA9ATAC8AG6AG6ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C2AGAG7AT2TGAT1GA3CT1AG2CA1G-A-T-5AG1GA4AG20CT3-A3ACCA1GA2TG3G-1GA9GACAAC1AG4TC1GAAGAC7AGGA3AC5AG4AT26AC3AG3AG4ACTC8AT19AG3AG18CTAT6GA18A-A-2G-7AT3AT1CG1-G2-C-T-G2CGAG1-T-C2CA5AC1AG2-G-G2TG-T-G-A-C-A-C-A5AC5GA20CA4GT7GA5AG22TC6AGAGGAACTA6GA2CT17AG2AGAC14AG2AG3CAAT1CGTC2TC1GA1AG1AGGTACAC4CT10AG3AG1AG2AG6AG8AG21CT17GA6AGAG19CA1AG4AG3AG21AG1AGAG3C-G-T-8AT7CTAG7AGAG2AG16AG8GC3CA10AG5AG29AG12CT6AG22AC18AGAG8AG15GA5TG4AG12CA1AG15AGAG6AGAG8AG20AG9AG4AG6AG3CT9T-A-1AT1TG1CA2TGCA1ATAT1-G-A2AC3TC5AG4CG3AG13CA1AC10AGGCAT5TC2ATAC4CA2AG12TA3AG2GAAG11AC10AG3CT5CA4AG4AG5AG5AG5GATC8AT5AG1AG10AT25AG3AG6AG4AG11TC25AG5CT11AG2GT7TA12AG2AGAG4AC12AG3TCAC13AG1AG12GA8GTATAC9CATCAG3TC3AGCG4CT4AGAG5CT4AGAG11TC13AG3AG1AG18GACATC2AG2CT4CG2AC4AG4AG2AG1AGAG2AGAG2GAAGTC6GA2CT1AG2AG2GA6GA7AGAG1TG37AG3TC3TC2CA11AGAG1AG7AGAG12AGGT4AGAG1AGTC1AT1CT6TA3TG14AGGA8AG5AG4AG1GACT5AT4AG2AGAG9AG10TA2AG2GACT1AG3AG4GA6AGAG8A-G-A-A-A-3T-T-A-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-A-G-A-A-A-G-A-2AG17CA2AG3AGAG17TC1AG6TC2AG23TG2AG4TC16AG18AG2AG2AG2AG2CT10GC6AG26AG6TG2AG47TC1GC5GA11AT9TC5GA1TC14AC17AG14AG12AT24TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG11AG7AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,598,8845,9441,1,598,0.0,659,88.629,530,plus,14TC1GC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA5AT24TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG11AG1GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG6AG12AG17TC7AG3AG4CT1AG20GC21CT10AG30AG19AGAG86-G5 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,201,104,304,9486,9686,2.55e-74,278,98.010,197,plus,19GC21CT24GA78TC55 +MK114856.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9477,9718,111,1,111,627,736,2.52e-31,135,92.793,103,plus,40TGAGGA8AG2AC45C-1AC3TG4 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,9077,150,9207,636,9626,0.0,9759,87.937,7982,plus,31AG41-A23CG21GA3TA38TG20CG3AG8AC3AG10TCAGCGCT9AGAG16GA17AG30CT2CT14GATA13CT2GA5TA2AG15GT50GATC9CT2AG12AG1TGGA20CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC11AG8AGCG1ACTA24AG10AG28AG18CT8AG41AG1AG20GA11AG11TG2GA10AG7TG19CG22AG9AG20CT24AG3AG7CA28CT20AGAG1GACT4CT24GATC7TC14AG7AG10AG3TC11AG16AGGA2TC8GT8TG10AG18AG14TC14CT14AG8AG6TC32AG13CT41GT5CTTA7AGGA4AGGA12AG14AT28AG1AG10AG17AG6AG7AGAG6AG8AG23AG6C-1G-A-C-T-A-A-G-A-C-13AG7TC9CT15AG9CT26GA4CA14TC2AG2AT4GA5GA4TC15AC3AT4CA1AG15GA10AG20AC1ACAG1ACTA7AG5AG11AG47AG1AG11AG2AG16AGAGAGAG5AG2AG29GA3CT9TC30AG10GA2AT12AG16CT3CA2AG22CT2TC8AG21TC7AG3AG6GA36GA6AG11GA4AG2AG9AGAG7AT8AG7GA8TC44AG1AG16CA19AT10AGAG9CT2AG49AG5AG23TC5CTAG10AG23CT15GA6AGAGGA3AG25AG3AG4AG55GAGC31AG15AG18AG6CT14AG2AG17AG5AG5CT14GA12AG10TC4AG3AGAG24AG16CGAT9CA10AG27AGAG1AG2GA7AG6CT5CT2TC4AG11AG46GA72CTAG33GA11AG2ACGA2AG5AG44AGGA13CT3AG26GA24GA2CATC4GACG12AGAG22AG2TC8AG7AG1AG3TCGA9AG18AG11AGAG2AG5CT17AG3CT3AG28AG10TC9AG2AGAG9TC2AGAG11AG9AGGA8GTGA1CT3AG10GA6TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG6AG1TC2CT7AGAG2CA12AG6AG31AGAC1AG7AG1GA10CT5AG10AG8AT8AG16AG16AG52GA6TC11CG1TC6AG53AG5AG7AG21AG4CT18GC28CT3AC1CT19AG11TC9AT21AG1CTAG4AG4AGAG10AG2AG3AG1AGGA15AG1TA14TC9AG8AG13TAAG27AG48TC2TC51AG35CT14TA18AG22GA1AT71TC33CA4AG6AG58AG3CA21CT2AG5AGAG7CAAG1AG3AG1GT4CT19AC1AC6AG2CT22TC3AG3AT2AT13AC8AGAG32AG2CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC5AG8TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG7AG5AGGA2AG16CTCT12TC4CT2TC12AG6AG9GA5ACAG3TC22AG17CATC9AG3AG14AG4TAGA10AC16CAGA24CT4CT7AGGC29AG19TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT8CT2GC13GACT24TC6TA1AC10AG6TA11GA18AG5AC3GT33CA-G3GA1CACT1ATGC2GC1AC2AG1C-C-1CG1CGTA1-G-G-G-G9AG4TC1TA2TC5AGAG3AGGT1AG5AC8CT1-C-A-G1CA2CA4AG16AGAGAG8AG1AG3AG8TC38GT6AGATGA10AG3AC2CA25GA6GA7CT3AG1AT14CAAT10AG18GA28AG24GA3CT18CG6TG9A-A-2TG2AGTACA1AG1C-T-1GAC-C-4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5AGT-G-A-A-A-2AG8AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT9AG2GA2GA11GA1AT4G-T-A-A-A-A-A-T-A-4GCGA2A-A-A-6AT3TC2AG24AG21AG18TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT4CT18AG2AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT2GC2CT2AGCA1TA4AG2GA4AG8GA4AG11-G2AC2GA2TGA-4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA6CATG13AGAG8GA2AT2GA1TC3TC12AG3AG19AT7GA16AG1ATAT11AG1A-A-T-8TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGATAG1GA35GACT2GATC10AG1GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA3AG5AG9AG8AG7AG22CA6AG8AG2AG11CA1TG20AG1AGGA12AG1AGAG2CA1TA1AG6CG6AG7AGAG19AG8GC3GA10AG41AG14AG40AGAG22AG1GA8TG1AG14AG14AGAG6AGAGAG29AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AGAG2AC1AG7GA11GAAG1AT5TC1TCATAC10CG4AG2GA5AG6CA13CA7CA9GA1AG11AGAG4AG4GA4TA3CA1GT1AG3AG1AG10AT10AG6AG8AG2AG17AG2AG4GT13AG9AG5CT8GA2AG2GT7TA11AC3AG18AG4AC6AGGA4AG2AG3AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC13AG12AG4CTGAGA4AG5AG8AG8AGAGAG2AGAG5AC2GC2GA4AG2AG9GA7AG10AC13AT14CTAG7AC15AG9AGAGAG11TG5AG3GCCT1TG11TG11CG1CA16AG4AG1GACT13AG3AGAG5TG5GA3GTCATGCTAGAT1GACT1AG8GA1CTAG3AG3GA1AG3AG9A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-9AG3CA2AG3AGAG20AG3GA10CA1TC31AC1GTTG6CG12CG2AG2A-A-A-2AG5AGAG12GC18GA15AGGC4CG5AC22AG11TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC3AG3AG5TA18TG8AGGA12GA1GATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG1AG5GT3GCACAGCG1CG8AG2GACG35AG1AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,543,8665,9207,1,542,1.27e-164,578,87.293,474,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC3AG3AG5TA18TG5TG2AGGT7GA4GATCGATA1AG9AC1TA8ACGA3CT1ATAG1AG7AG7GT3GCACAGCG1CG8AG2GACG37AG23TC1AT4GA10CTTC3AC2TG6AGAG11AGAG10G-14AG3AG4AT1AG20GC21CT10AG9AG20AG19AG37 +MK115009.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9207,9718,151,1,150,781,631,2.96e-50,198,96.026,145,minus,22AT3CT21GC23-T41TC12AG23 +MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9718,9035,155,9136,649,9626,0.0,10641,91.489,8266,plus,18TGAGGA85-A-A-A49TA24ACAG27AG10GA57CT2CT5TG9AT4GA2AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC13ACGATC1CG2GACT20GT12CA31GA23GA20CT2TC8GA2AG23GA95GA42GA13AG50AG10CG11GA27CT32GA30TC9AG49GATCCT17AT2GA5TG26AG14AG41AG2AT35GA2GA14AG42AGAC2TC41CT35TC50GA68CA18CT38GA13TC5ATGA6GA7TC18GA1GA9GC11GA9AGAG40AG41CT97CTTC68CA6TC19TC20TC8AG12CA88AG8AG8GA95GA11AG41CT20GA6AG35AG11AG43TC85TC24GA38CT53AG11CTTC6AG7TC1GT11TC20CT8GT59CA5TC27CT7AG26TCGC13GA2AG19AGGA3GA7GA11GA4AC39GA2AG59GATA22GA50GA10CT7AG64GA14CT4GA9AG8GA2AG11TA2CA11AG23CT14CT32AG5AG8TC2TA14TC23TC37GACT14GA6TA31AGCT1GA10GA6AT11AG39CT7AC18ACGAGA12AT39GA6CT2TG77CA8GA23GT2GA16AG66TC11CT8GA10CT37TC88GA8AG11CT2CT2CT17GA8GA3GA10AT8AC1CG10AG12AG18AG2GA13GT3CA71AG35CA93CA19GA46AG4GA25AG2TC2TC141CA32CTAG5AGAG6CTCAAG29AGTC35GA74AG17CG3GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG59AC22CT5AG10GAAT25CTAT5TC8GA2AG33AG14TA31TC17CT1AG16AG1CT43TC34GA3CG10AT14AG2CT34GC46CG3CA3AGGA18TCATCT5CT9GA7TC11TC1CTTA2TCACTA3TG2AG23GACT4TA17GT8CA12AG11AG6GA1GA6TC15AC7TA2GA32TACAAT1GT-C2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC12AG13AG4AG2GA4CACA1GA1GT35GAAG7AC37AGGA8CT55AG5AT1AG1GT6AG6GA16GA3AG10TA38TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CG-C-G-G-G-A-G-A-A-T-G-A2CA1TG1GA-G-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG2AC1AG6GTCAGT3CT11AC5TA2GA2GCAC7GA1AT2G-A-A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT34TA21AG8GA13AC5GA5ACGA26GA19AG55AG1GA10AT4AT4AG6AG6AC13TC4GCGAAC1GT1CTAG2CG5TATACT4TC27TA2ACACAG3-C-C-A-G-A-G19TGATCT4CT4GA1T-A-T-7GA1CT2AG2GA21GA1-A-G-C3TA28CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT16GA8AG26CT5TC9TA2TCCA15CT3ATCT3AT1A-T-G-5GT1TG3TAGC-T1CA1-G-G3TA3GA1TC3CG1-A-G3-G2GATC1ACTA5AC4AC25CA8GAGA44AGCA3AT20GC1TA14GT2GT2GTGATGGC1TATC5AGAT1TC4CT3TC15AG6AG3TC37GA16AG19AG14AG5GA11AG3CA1GA6AT25CA20GC5AGGA9AT11GA1GT19AG42TC25TC18GA23CA16AG2AGCA35AG14CGGC7GA1T-G-G-G-C-A-3CT3ATAC3AG2TAGC1CG6GAGA1AC3TC18AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG28CA34GA5TA2CA1AT18AT69AG15CT11AG10TA7GA1TC9GC18TCAC7GA17AG2GA7GAGT17TC3AG20AG35CA17GA1TCCG62GA5CT29CT11CTAG7TC4TC9AG12AG1AT6AG2TG5AG2AGTC1GT8TA3TG12GA17AG6GACT38AGGT1GA8ACAC1GA1AT2GA14A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-G-G-G-A-22GA17AC14TC8CA1TC8GC14TC7AC31G-A-T-19GC21CA8TC2AG6CG7GT39GA2TC9AG3GA41TC36AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT23AG7CT3TA21CA12AG11ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G21CT22GC18-T56TG45 +MK115387.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9136,9718,542,8609,9136,1,542,1.63e-174,610,89.852,487,plus,11GA2TC8ACAG3GA41TC10GA36CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT6GA16AG7CT3TA21CA24ACAT11TA2AT3AGGA11AC3TC2TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG21CT22GC18-T56TG45 +MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9718,9143,312,9387,577,9685,0.0,10915,92.136,8424,plus,25-G-A-C3-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23C-TA1TA2TG1AC2A-2GA1T-C-C-C-TG1TG3TGCGTGCATA1GC3TA2CA2C-C-G-AT4GC1T-A-2TGACGAAG5AG18AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25 +MK115491.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9422,9718,654,8787,9414,1,645,0.0,705,88.532,579,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT96TC26G-A-C-T-C-G-C-25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A23 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,7800,1191,8938,1230,8996,0.0,8979,90.526,7061,plus,2CG17-G-A-C7AG5GA33AGGA4CT15CT5TC3AGTA6TC5ACACAG15CT4GAAG13AG7CA13GA13GC3GA24CA19GA14CT20AG13ACGA27GA8CT14CA1GA7GA10TC1CT3GA2TG34TA7AGGA37AG27TAGA11AG65CTCTAG9AG24GA3GA47AC4GT17CT11CT16GA28AG76GA8GA30AG55GA11GA11TC17GA8GA11AG2AG20AG35AC14TC5GA20CG3GATC79GTCG15TC14GA2GA14GA5TC18CT1AG3AG13GA3TA4AG8GA29AG11GA14CT2GA2GA23CT8GT32GA6AGCTAG5AG41AG8AG20TCGC15GA21AG9TG27GA46CA1GA32CT12TA4AG8AG8GA5TA5GA11AG14GA11GA11AG1AG4AG29CG4TA41AG11TC1GA63CT17TC17AG20GA5CG20AC8CA8AG2CT2TC5TG26TG3GA4GA12AG5CT22GA21TC8CT10AG4CT9CT6TA10GA6AT7TCCA19GA12TA6AG22AC10AG9AG7GA11AG57TC4CTTC28AG5GA50CTAG41TC16AG8AG44GA32GA14TA44TC3AC31CA26CT5TC2CT3GA7AG2CT14AG23TC38GA35GA5AG14GA23CT33AG31GA6TA10AG95CT2CG35CT5AC41CT36GA20TAGA10CT8GA9CT9GA5TC1GA2AG5GT1TG4AG10GC4TC1CT1AC25CT11GA2TG5AC2AGAGAT5CAAG32CA11CT2GA20AG3AGAGGA2CA5TC14TA1AGACGC16CT44AT6GT9GT48CT15TC2GA8GATG2AC1TC4AG4CT18CT4CG3GA5GA25GA11GA5GA2AG5TC9GA27GAAT14TC2CT7TC6TC2GCAG1CA5AG5CTGA9CA9TC6AG10AG15TC8AC7CT11AG10AG20TC2GT2GA1GA5AG20CT5CA4CA12CT20TG7CA2AC15GA2CT5AT28GC46CG7AGAGGA1AC2AC2GA8AGAC1CT5CT14AGCT6CA5AC5GA6GTGT2CG20GC1AGCG24TC6CA30AG9TC2AGAT4AT9GA40CT8GA2AG8GT5AG1GT7GCAT10AG2GA8CTTA11AGCA36AG5GA53GA20GA17GA21TG6GT13GA7TYGACTAG4AC11TC3GA38CTTC22CT5TC7TC3GACA11GT1CG1AGCA7-C-T-A-A-T-A-C-C-A-A-T-A-G-T-A-C-C-G-C-C-G-A-G7-A1AGTC2CA7CA1AG28AGAC4CGAG6GT1AG33GA17A-A-G-6G-A-T-2T-A-G-C-T-T-T-A-A-T-A-A-T-A-A-33TC5AC5TC38CT3AG12AT3AG7GA6CTAG2GA3CAAG11AC2GA7CA10TA2AG21GA9GA15TC17AG2CG1GA18CG7CTTA1GA7TC24GAAGCACA6AG7CT8GA2CT2TC3AT7AG5TA3CAAC1GACTAG10AG4ATTA4GA30AG9CT9-A3G-2GA1GA6GA1TC19CA7CA11GAGAGC5AT11CT2TGCA4GC25CTAG10AT18TC1AT13CA24AGTC1AC2GATAAGCGTA3-G2TGTAGT1AG1TG2TG1CA2GAT-17TC1AG5GAGA21AG22TC9CG1TA10AG3TCTA1AC35TA6GC1GA1GA2AG2GC1-A-A-C-G-A-G-A-C-T4CT12CA6GA26TC21GA16CG50AG1AG4CT1C-T-G-27AG29AG22GA1AT21GA19AG48TC2AG18CT1GA18CA46TC35CT12AG4AG6GA17GC1GA7AG8GATC9CGAGAC11TC17GA1GA3GA16AT3AT3TC2GCCA1CT7GA4ACCA2CT7GA7AGGATC8AC41CA2AGAG4GT9GA22AG5AG14TC8GA2AG10GA1TC30AG15CA22GC4AGCG9AGAGCACT9CG2CA9AT3CT3AC3GA47CT1GA24AG13AGTC7CT9GA9AG20AG2AT57AG11GT9CT2GA13CA8GATC4CA1AC5AG5AG5AG19GA15GTTG4T-2T-T-G-G-A-23AG5-A-A-C-T-A-A-G-C-C5GA12AT2GA10TC4CA10CA22AG7CG7TC7CA30-G-G-G12TC5TC1GAGA5AG33TC1GA42AC1GA2AT8GA35CT29CT11AG11GA2TC26AG9CG5AC4GCCA9CA5CA2GA3AG2GA21TA3AG15TA10GA6AGCT20AC4AG5TG7GTAG3ACAG4CATA18AG11CT1AG2TC3AC30G-24-G37CT5CT-T33TA22GA2GA45AC26 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,1137,58,1194,1219,86,0.0,1395,92.964,1057,minus,2TC11TA2CT83TC41AC8AG17GA2TC48TC17AGCT3AG8TC28CT9AG2GA2AT5TC19TG48AG23TC13CT66TC8TG23AG16TA23CA15AG17AG50CT26GC1GTGA17GA8GA9TC1AG3CT3CT1CTCT18TC2CTAT4GA11CT14AC4GACA3CT12GT2TC7CT9TC12CT4CT16TC4CT8CT5TC2GA3GCAT3CT41TC2CT49GT9CT17TC7TG12TC6TCGTGA7TG57GTTC4A-C-T-25 MK116110.1,Ref.B.TH.90.BK132.AY173951,0,8967,8996,57,1,57,4,60,1.43e-11,69.7,91.228,52,plus,14TAAGGA8AG2TC28 -MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9719,9071,480,9481,576,9625,0.0,10861,92.239,8367,plus,26-G-A-C-C-C-T-T2-A-G-T-C-A-G-T-G-T-G-G-A15C-3A-1ACTC2G-G-C-TA1GA1TGAG2TCAT2GA1TG1CGTACA2TGAG2TA17GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9719,542,8949,9481,1,540,8.48e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9719,9035,70,9055,648,9621,0.0,10441,90.747,8199,plus,19AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA69GATC9CT2AG12AG1TGGA20CT6CAAG11AG20GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG13CA23GAAG28AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC8TC20GA2TC8GT8TG59CT14AG8AG6TC31GA2GA11CT47CTTA8GACT3AGGA21AG2GA2AT30AG4TC50GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA21GA10AG20AC1ACAG1ACTA6GAAG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA27CA8GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTCG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA20CA7CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA30CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC1CA26CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA25AGGACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT24GA23CT15TC2AG21GA2GT9CT5CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA20CT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CTCA7GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2ACAC5CT11GC14CT24TC6TA1AC17TA11GA24AC3GT27AG5CA5CACA-T1GTGC2GC1AC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT4AGAT14CAAT29GA53GA3CT18CG6TG9A-G-2TG3-A-A-T-G-A2AC6TC3TAAG2AG1-A-G-C-G-G-G-A-G-A-A-T-G4CT3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT4GA7GA2GA2TC8GA1AT4G-T-G-G-A-A-A-T-A-4GCGA2A-A-A-4GA1AT3TC2AG24AG12AG27TA30GA4GAATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC1CT5AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG19TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA11ACA-6TC2TGAC7AG4AC6-G-A-A1GT12GA7TG23GA2AT2GA1TC3TC36AT7GA18-T-T-T3GA5-T-G2TGAT1TC2G-2TG3-C-A-A-A-T-A-A-C6TGCG2AG1AG4TA5AC30TA8GA9GA12TC9CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CTAC5GA59CA18AG11CA1TG20AG2GA18CA1TA8CG44GC3GA52AG14AG66GA8CG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8GT1CG7AC1AGGA6GA11GAAG1ATCT4TC1TCATAC10CGTA3AG2GA5AG6CA13CA7CA9GA16GA7GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11CG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA10TA5GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG3TG5AG5GT3GCACAGCG1CG8AG2GACG16TC18AG22AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 -MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9719,537,8519,9055,1,536,6.00e-175,612,89.944,483,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG3TG11GT3GCACAGCG1CG8AG2GACG16TC41AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,9023,565,9537,623,9625,0.0,10895,92.563,8352,plus,26A-C-T-C-TG4T-13TGAG20GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,542,9005,9537,1,540,6.18e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9719,28,370,397,622,649,0.002,42.5,100.000,28,plus,28 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,8984,200,9165,768,9676,0.0,10431,90.895,8166,plus,51CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC9CT2AG4CA7AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG2TA35AG28AG18CT73GA11AG10CATG2GA18TG19CG23GA29CT36CA25TA2CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA24GA2AT30AG10AG44GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG65CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC63CA19AT21CT52AG29TC5CTAG10AG23CT15GA7AGGA94GAGC55TC10AG6CT17AG18GA10CT38TC51CGAT9CA15AG25AG2GA14CT2AG2CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG47TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA2TA3CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGGC9AG12CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC110TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA19CTCT12TC4CT2TC2-T17AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2GA2CACA-T1GTGC2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-2TG2AGT-C-T-A-3CGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11GA1AT1G-T-A-G-T-G-G-A-A-7GCGA2A-A-A-4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA7GA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT14A-T-G-7CAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG1AG3CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC1CT8CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC26CT8GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT12CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA24AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1AT2AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,592,8574,9165,1,591,0.0,690,90.878,538,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1AT2AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,129,1,128,778,650,1.18e-41,169,96.124,124,minus,19AT3CT21GC23-T41TC17 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,72,130,201,623,694,1.90e-21,102,98.611,71,plus,44AG27 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,48,9167,9214,463,510,5.46e-12,71.1,100.000,48,plus,48 -MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9719,48,9167,9214,9548,9595,5.46e-12,71.1,100.000,48,plus,48 -MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9719,9068,648,9663,640,9643,0.0,10103,89.314,8099,plus,27TGAGGA62AG22-A-A-A13AG20AGAG13TA24ACAG27AG10GA57CT2CT5TG9AT7AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC8AC4ACGATC1CG2GACT20GT12CA31GA19AG3GA20CT2TC8GA2AG23GA95GA10AGAG30GA75CG2AG8GA27CT20AG11GA30TC9AG49GATCCT17AT8TG10AG15AG2AG11AG32AGAG7AG2AT35GA17AG42AGAC2TC41CT28AG6TC100AG18CA3AG9AG4CT52TC1AG3ATGA6GA7TC18GA1GA5AG3GC11GA9AGAG40AG5GA35CT17AG16AG17AGAG11CT30ACCTTC68CA6TC14AG4TC20TC8AG12CA7AG8AG3AG67AG8AG3AGAGAG2GA12AG61AG19AGGA11AG16AGAG12AG10CT6AG13GA6AG10AG5AG18AG11AG9AG33TC3AG9AG35AG4AG30TC24GA32AG5CT9AG17AG25AG11CTTC6AG2AG1AG2TC1GT11TC20CT8GT5AGAG52CA5TC27CT4AGAG1AG11AG14TCGC3AG9GA2AG19AG4GA7GA11GA4AC38AG3AG22AG36GATA11AG10GA50GA10CT3AG3AG64GA5AG8CT4GA9AG8GA2AG7AGAG2TA2CA1AG9AG16AG6CT4AGAG8CT25AG6AG5AG5GA2TC2TA14TC12AG10TC1AGAG12AG21GACT14GA6TA31AGCT1GA10GA6AT11AG39CT2AG4AC18AC1GA12AT46CT2TG4AG16AG5AG2AG32AG13CA12AG19AT2GA3AG12AG5AGAG45AG13TC11CT9AGAG8CT4AG20AG11TC34AG21AG31GA8AG11CT2CT2CT17GA1AG6GA3GA10AT8AC1CG10AG12AG11AG2AG3AGAGAGGA13GT3CA25AG45AG35CA93CA19GA46AG4GA25AG2TC2TC79AG61CA32CTAG5AGAG6CTCAAGAG28AGTC35GA34AG33AG5AG19AG1GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG51AG7AC22CT5AG10GAAT25CTAT5TC11AG22AG10AG7AG1GA4TA31TC2-T10AG4CT1AG16AG1CT24AG18TC34GA3CG10AT14AG2CT25CT8GC46CG3CA3AGGA18TCATCT5CT9GA7TC6TC4TC2TA2TCACTA3TG2AG23GACT4TA15AG1GT8CA12AG11AG6GA1GA6TC15AC7TA1AGGA32TACAAT1GT-C2GC1GC2AG1CGAGGACG2TGTG-G-G2AG5AG5TC10AG1AG13AG4AG2GA4CACA1GA1GT19AGAG14GAAG7AC37AGGA8CT11AG43AG5AT1AG1AT6AG6GA16GA3AG10TA28AG9TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CGTCTGCGTG1-G-A2AGCA2CA1TG-G2-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG1AGAC1AG6GTCAGT3CT11AC5TA2GA2GCAC7G-A-2AT2A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT15AG18TA13AG7AG8GA13AC5GA5AC27GA12AG6AG55AG1GA10AT4AT4AG6AG6AC13TC4ACGAAC1GT1CTAG2CGGA4TATACT4TC27TA2ACACAG3-C-C-A-G-A-G1AG7AG9TGAT5CT4GA1T-A-T-4AG2GA1CT2AG2GA21GA1-A-G-C3TA4GA23CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT5AGAG9GA8AG18AGAG1AG4CT5TC9TA2TCCA15CT1AG1ATCT3AT1A-T-G-5GTAGTG3TAGC-T1CA1-G-G3TA3GA1TC3CG1GAAGAGTA3AG1TC-A-C-A5AC4AC25CA8GA5AG29AG9AGCA3AT19AGGC1TA12AG1GTAG1GT3-A1AC3TA1-T-G-A-G-T-C-C-G3CT3TC9AG3AG1AG6AG3TC12AG24GA13AG2AG19AG20GA11AGAG2CA8AT8AGAG6AG8CAAG10AG8GC2GA2AGGA9AT11GA1GT1CA17AG20AG21TC18AGAG5TC18GA10AG12CA16AG2AGCA4AG9AG20AG9AG4CGGC6AGGA3G-G-C-4C-A-A-A-A-2TCA-C-A-A-A-A-G-3AG2TAGC1CG4AG1GA2AC3TC5AG3AG4AG3AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG3AG24CA11AG11AG5AG4GA5TA2CA1AT18AT25AG3AG39AG9AG5CT11AG10TA7GA7AG3GC14AG11AGGA4AG12AG2GA7GAGT17TC3AG10AG9AG8AG26CA17GA1TCCG1AG15AGAG6AG1AG3AGAG16AG2AG9GA5CT1AG27CT11CTAG7TC4TC9AGAG9AG1AG1AT6AG2TG5AG2AGTC1AT8TA3TG12GA17AG4AG1GACT13AG24AGAT1GA2AGAG2AG1ACAC1GA1AT2GA1AGAG8AG2A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-A-A-G-A-23AG3AGAG11AC7AG6TC8CA1TC7AGGC14TC7AC24AG6G-A-T-5AG13GC7TG13CA8TC2AG6CG7GT39GA2TC9AG3GA41TC10GA22AG2AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT4AG18AG7CT3TA6AG14CA12AG11ACAT11TA2AT3AGGA11AC6TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 -MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9719,558,9120,9663,1,558,4.74e-171,599,87.993,491,plus,11GA2TC8ACAG3GA41TC10GA22AG13CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT4AG1GA16AG7CT3TA6AG14CA24ACAT11TA2AT3AGGA11AC6TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 -MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9719,9071,541,9544,577,9625,0.0,10835,92.129,8357,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG1AC2A-2GA1TG1CGCATA1CGTGCGCA2TC1TACG2CG10GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9719,542,9012,9544,1,540,3.24e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,8890,661,9500,755,9626,0.0,10711,92.463,8220,plus,3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG81A-T-G-G-G-21AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC13GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,544,8966,9500,1,541,1.71e-174,610,89.890,489,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 -MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9719,99,9492,9589,4443,4345,9.70e-29,126,94.949,94,minus,4GT7GA36AG20CT9-A18 -MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9719,9088,581,9617,577,9627,0.0,10868,92.221,8381,plus,26-A1TC2ATGTCT3GCGACGGTCGCTCG3C-A-G-21G-G-A-C-T-C-T-G-G-T-3T-2AG2T-3C-A-C-TG3TG1T-A-1CA1GATG2CAGACA1GC7A-8GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9719,544,9083,9617,1,542,1.19e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 -MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9719,9069,479,9485,577,9625,0.0,10895,92.370,8377,plus,25A-C-TG1ACACTCCT1CT3-T5CT1C-C-C-3CA1G-G-G-AT40TGAG20GA29AG20-A-C-T-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2GT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA24GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA29TC5TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTTA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA13GT4AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 -MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9719,542,8953,9485,1,540,6.15e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 -MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9719,9072,349,9353,577,9625,0.0,10877,92.284,8372,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG2TCAT2G-1TACG1CGTACA1AGAGTGCA19GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9719,542,8821,9353,1,540,8.37e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,8943,204,9098,747,9608,0.0,10376,90.876,8127,plus,2GT2TG1AC15TC48CG2CA8CTACAG27AG4GA4CAGA45CA8CT2CT29CT1AG7AC7AG2CA6GT50GATC12AG5GA8TGGA4GA2TC5AG14AG32GAAG14G-C-C-12AC3AG2GACT2AG17CT14GC5AG26CT5CTCT20AG13AT14AG18CT7GA92GA32GT5AG3GA16AG2GA55CG10CA10CTGA16CT18TC5CT16GA12GATC7TC58GA11TC17AG6GAGA51CT22GCAG38GA9AG13GA8AT16CT4GAGA1GT2CGAC1GA27AG14CT9CT23TC1TC29GA42CT2CT29AG12CT13GA8CT35G-G-A-G-A-G-C-C-T-C-A-G-G-C-C-A-A-C-A-G-C-C-C-C-A-C-C-A-G-T-14TC5AT7GA2GA1CT3TCTC12AG4GT9GAAC3CA3CT3GA9AGAG19ACGC1AC24AC19CT33GACGGT75GCCT9TC14AT2TA32TC17AG38TC8AG14GA27AG58AG14AG14AT27AG31GA80TC5AG18AG25CA26AC32CT81TA16AC29AC23CT56AG2AG3GCGA11AG6GATC28GA43GA19AGAT9GA5AC1TG33AG8CT23AG10AGAG20GA12TC58AG39AT7AC23AG11GA56GA53GA6TA1TC44AG25TC12CG40GA3TC6CT4AG66TG4TC30AG5GA1CT14GA13AC9CA5AG5AT15CTTA6AT11AG10CT9GA45AC21GA34AG4CT3AG16TC20GA21AG4GA2TC9TC21GA9AT2GA7GA36CT68TC12AG25GA14CT12AG82CT3AC1CT41AT21AG2AG1CT2AG4AG21GAGA16TA17GA11GA32AT11CA50TC59TC45TA13CT27GA28TC20GA11GA41AG17CA60CA30AGAG4AG3AG27GA3AC9AG37GAAGGA6GA17TC4GTCA4GA5GA38AG3GAGA9AC5CA2GA6AG1CA24CT10TC11AC12CA1TG3AT10TC1GT54GA22GT1GA37TG5AG53TC28AG2AG6CA1GT11GA12CACTAT5TC3AG11TC34GA20GT20TC2-T17AG16AG3TCCT1CG22TG13AGCA35GA10AC25CT21CT1CAGC5GC35GA1AC5GA2TG3TA1AC1AGGAGA1CA5GA9ACCT31TC1TCTA1TC2TA1A-G-A-1GCTC13AGCT16GAGT22AT8CA1TC40AG1AT2CA8AC3GT33G-G-G-G-G-A-T-C-3A-4TA1GA5GA14-G-G-T1CG1CG1ATTG1CGTG18AG2AG5TCAT3AG10CA34AG5AG8AC11CT90AG1GA5AGAG46TA2AG5AT5CT3GA4CT52CGCT5TG6AG5A-C-C-A-T-T-G-A-G-C-C-A-2CG4CA6ATGA6TG4-A-G-C5-A-A-T1TA2GAAT2GA9AG2GA1CA16GA3CG7CA6AG4AGGT1AC14CT1CT15GA2GA2GC3CT2GA1GA1ATAG3AC2AC5TA2GA5TC9TC7ATGC26AC5AG47GA6GA4AG1AC16ACAC5ACCA10TC82GA9CT7TA1AG6AG4GA22AC1AT6TA33-A-A-AGA4-T-C-C4AC2TG1TG2CG16TGAT1GA3CT4G-A-T-1TA7GA4AG3AC21AG2AC1GA1TA7CA9CA3GA1GA4AGAC6CAAG11-G-A-A1GT3GACA7GAAT6AG1CA29TC40AT4GAGC4AG3TACA1TA1GT1-CAT2CG1ATCT2CT1AGAT3-T-G1TATG4T-G-3TG1CG1A-6GA2AC1AG1TA3-A-G-T-G-A-C2CA4TCAC8TC29AGGA1GA29TCCA19GA14AG23GT1CA2A-C-1GCGA3GAGT2A-C-A-G-1ATACTC4CT15GA3AG6AG30CT9GA5AG65AGCGCA9AT14CT4GA26AC3CA46AG12CT10GT11GA32AC2AG15GA16GA7GAAG26CT17CT9AG14AGTC14GA1AT5AG1TAAC1CG6GA1CTAC1TCTATC3TC6CG7TC1CG20AG1ATAT4TC2CTACAC3CA4GA3GT4GA8GA43AG16GA5TA4CT11CT6AT8TA1AG14AGAG20AG37CT22GA1TC5GATC29CTCA36GAATCTAC15TC4AG12TA7AC94AC18GC4GA2AG41AC16TC22AG8TG3CT4AG2AGTC9-T-A-T-T-C-G-C-C-A-C-A-T-A-C-C-T-A-G-A18AG5CA33CAAG4AGAT2GT2AG4GC2GAAC16GACG2AG1AG5GC11GA12TC9TC7GA31AG3AC15TC43AC9GA5GA11CT7GC4TG44TC5TC1TC7AG9CT15GA5AC24GA24AGAGCT5TACT6TAGC14TA18TG9GA1GA5AG19AC16AG19GT3AC1CG8GA6AGTA5AG30AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT22AG1G-G-G-A-G-G-C-G-T-G-A-C-11-T22GC21CT3TC5GT47GA6GA15 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,535,8565,9098,1,523,1.26e-164,578,88.037,471,plus,8TC5TC1TC6ACAG9CT15GA5AC24GA24AG1CT5TACT6TAGC14TA18TG5TG3GT1GA11TC13AC16AG13GA5GT3AC1CG8GA6AGTA5AG28GA1AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT12G-G-G-A-G-G-C-G-T-G-A-C-10AG12-T22GC21CT3TC5GT47GA6GA15 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,161,1,161,4772,4612,1.47e-54,212,95.652,154,minus,48GT11TA32CT11CT17AT16CTCT19 -MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9719,51,160,210,649,699,2.00e-12,72.5,98.039,50,plus,18AG32 -MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9719,9115,49,9137,649,9681,0.0,9873,88.195,8039,plus,18AG41-A23CG9AG11GA3TA11AG20AG26CG12AC3AG10TCAGCGCT11AG15GA48CT2CT12AG1GATA13CT2GA5TA2AG15GT44AG5GATC12AG7AG4AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC2AG8AG8AGCG27AG10AG28AG18CT50AG1AGAG19GA11AG11TG13AGAG6TG19CG22AGGA8AGAG19CT24AG3AG36CT10AG10AG1GA16AG13GATC7TC14AG18AGGA2TC28AGGA2TC2AG5GT8TG10AG18AG14TC14CT14AGAG7AG6TC46CT41GT5CTTA8GA4AGGA10AT1AG14AT30AG10AG17AG6AG7AG13AG26AG20AG7TC9CT14AGAG9CT26GA4CA14TC1AGAG2AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG3AG1AGAG10AG39AG7AG1AG11AG2AG12AG4AGAG6AG32GA3CT4AG4TC3AG14AG11AG2AG10AT12AG16CT3CA2AG22CT2TC8AG29AG3AG43GA6AG11GA4AG2AG5AG3AG8AT8AG5AG1GA8TC11GA31AG19CA13AG5AT8TC1AGAGAG8CT2AG49AG5AG23TC5CTAG10AG23CT15GA5AG1AGGA28AGAG3AG61GC31AG15AG18AG6CT14AG2AG17AG1AG2AGAGAG4CT38TC4AG3AGAG17AG23CGAT9CA10AG27AGAG1AG2GA2AG4AG6CT5CT2TC4AG11AG22AG23GA42AGGA24AG3CTAG33GA13AGGCGA2AG24GAAG23AGAGGA13CT3AG26GA24GA2CATC4GACG11AG1AG22AG2TC8AG7AGAG4TCGA1AG2AG23AG11AG3AG5CT17AG7AG28AG10TC12AG10TC2AG12AG8AG1GA8GTGA1CT3AG17TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG5AGAG1TC2CT7AGAG2CA12AG5AG2AG29AGGC1AG7AG12CT5AG10AG8AT8AG16AGAG68GA6TC5AG5CG1TC60AG5AG7AG21AG4CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG4AG4AG11AG2AG3AGAG1GA9AG5AG1TA14TC32TA28AG48TC18AG24AG10AG35CT14TA18AG22GA1AT31AG39TC33CA52AG21CA21CT2AG5AGAG7CAAG1AG4AGGT4CT9CT9AC1AC6AG2CT22TC2AG4AT2AT5AG7AC8AGAG32AG2CT8AC46GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6GC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG13AGGA2AG16CTCT12TC4CT2TC2-T10AG6AG9GA3AG1ACAG3TC22AG16AGCATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC13CT35TCCA3CG1GA8AC9GTGT5CT2GA11TG9TC3TAGC1CTTA2GCAC5CT10AGGC13GACT20AG3TC6TA1AC10AG6TA10AGGA24AC3GT27AG5C-G-3A-C-C-A-G-G-A-4TA8AC4AG5AG-G-G-G-G-T-G-G-A-G-A-T-G5TC1TA2TC5AG4AGGT7AC8CT1-C-A-G1CA2CA4AG17AG9AG5AG8TC36AG1GT6AGATGA14AC2CA25GA6GA7CT3AG1AT14CAAT29GA28AGAG23GA3CT18CG6TG9G-A-A-2AG2TGC-T-A-3TGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-2ATTG5A-T-G-A-C-3AGGA7AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT12GA2GA11G-2AT1T-A-G-T-G-G-A-A-7ACGA2A-A-A-4GA1AT3TC2AG24AG40TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG7AG4GA6TGAT2GC2CT2AGCA1TA7GA4AG8GA17GAAGAC1GA1TA1AG4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA7TG12AGAG9GA2AT2GA1TC3TC12AG3AGAG18AT7GA16AG1ATAT5AG5AG2A-T-G-7TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGAT2GA35GACT2GATC7AG2AGA-G-A-1CTA-A-C-5TC1GATC5TGAT1ACAG3CT6GA3AG2AG12AG8AG30CA15AG2AG11CA1TG22AG13AG1AG3CA1TAAG7CG6AGAG6AG20AG8GC3GA52AG14AG40AGAG24GA8TG1AG14AG15AGAG6AG9AG20AGAC6CT1AGAG4TC5AG3C-C-C-1A-G-A-T-A-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AG3AC1AG7GA7TC3GAAG1ATCT4TC1TCATAC10CG4AG2GA5AG6CA13CA5AG1CA9GA1AG11AG5AG4GA4TA3CA1GT5AG1AG10AT17AG8AG2AG17AG2AG4GT24AG4CT8GA2AG2GT7TA11AC22AG3CT8GA4AG6AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC32GAGA10AG8AGAG7AGAGAG2AGAG5AC2GC2GA7AG9GA7AG10AC13AT14CTAG7AC14AGAG9AG1AG11TG5AG3GCCT1TG11TG11CG1CA16AG4AGAGGACT13AG3AGAG5TG5GA3GTCATGCTAGGT1GACT1AG8GA1CTAG3AGAG13AG4A-G-G-C-C-A-G-T-A-A-G-A-A-A-G-C-C-A-12AGCA2AG3AGAG19AG4GA10CA1TC31AC1GTTG6CG12CG4AG2AGA-A-A-5AG13GC18GA14AG1GC4CG5AC34TA9TC5AC13CT15CA5AC22CT1GA16AG7AG7TA7TAGCTC3AG9TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG7AG1AG2AG2AT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 -MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9719,597,8541,9137,1,596,0.0,658,88.610,529,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA16AG7AGGA6TA7TAGCTC3AG9TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG7AG4AG2AT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,9027,371,9347,622,9625,0.0,10818,92.279,8330,plus,27AGAGAGTA1T-2A-1CA1G-T-G-G-CA2CGCAGA1AGCGAG2TA1T-3C-3GA9GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,542,8815,9347,1,540,3.18e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 -MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9719,28,91,118,622,649,0.002,42.5,100.000,28,plus,28 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,9048,269,9266,600,9625,0.0,10863,92.352,8356,plus,5TC2GTGT2AGCTTC2AT1ATTGCGCA23C-TA1TA2TG1AC2A-2G-1TACG1CGTACA2TG4T-C-T-1TC2C-13GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC2-T7CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC6TC7CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA31CA17AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC24GA25AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,542,8734,9266,1,540,6.01e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 -MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9719,73,220,271,577,649,8.11e-04,44.0,71.233,52,plus,24-A-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T-G-G28 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,9720,18,9686,1,9574,0.0,11694,92.407,8982,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA164-G1TG5GA12TC31AG25CT82GA3AC97CT3AG14GT20TC8TC7GA28AG16TG35GA19CT5GC26CT8GA19A-C-A-C-A-G-G-A-A-A-C-A-G-C-A-G-C-C-A-G-G-T-T-A-G-A-C-8AC6GACT26AG6CA1TC89AG50TC11TC75CG1AG20CT76CG11GA27CT41GA8TC93AT70CT20AG41GA8AC5AG29CA12AGGC1GA16GA11AG12GACT27GA5TC1TC5AG99AG12CT4AG20CT24C-C-A-13TG8TC2TG2AT16TC7AG8AG17T-C-C-7GA9AGAG46GA26GA23CA4AG3AG73CT117TC8AG101AG14AG119GA69TC38AG37CT86TC22AT5CA2GA9AC2GA26AG29AG6GA13AG19AG7TC4TC2CA17AG26GT48AG1CA32AGCT7AG5AG32GA4AG21GA24GA4GA18TC19GA26GA51GC4AC10TA52GACT55GA8GA19AG1TC11GA3AG77CT2CT14AG47TC29AG6ATAT22GA1CT21TA10TC33CT19AG35CT5GA24AC21GA12AG5GA20CT59TC21TC19GT107GA23AG8GA27TC26AG49CT11GA20CT5CT41AT21AG2AGAC8AG21GA17CA203CA5CT6CT15TC40GA28TC26TA126CA30AG9AG23TA7ACAC8AG27GA1AG10CT61GA50CA26CT8TC11AC14TG3AT19TC47GA37GT9CT13AC3GA2AG5AG47TC14TC24GA27AT9AG11TC19AG14GA33TC7TC2-T17AG16AG3TC40GA34GAGA13CA3TC11AG2CT25CT8GC43CA6CA3AGGA11GC6GC1CT5CT24TC7TA2AC5TG14CT11GACT4CA26CA31GA24AC3GT27AG5G-G-G-G-G-A-T-C-3A-4TA10-T-G-T-G-G-A-G-A-T-G-G-G8GT6TC1TA10AG16AG10CAA-A-C-10TC29AG7AC37AGGA66GA5AGAGAT21TC6GA5AG22AG27TC16GA5TC13CG1CT4TG3-A-C-T-G-A-T-T-T-G-A-A-G-A-A-T-G-A-T10CA3GT5TC2AG1-G-A-A-T-G3CA1-G-G1CGCA2TG2AG-A-G2GA15TA3CT1GAAGAC3GAAG8AG4AGAT1-C5G-9CT8GA11GA4CA6GA1GT4AC2ACGC1A-T-A-A-G-A-G-T-A-A-T-A-A-T-A-T-T-A-4T-T-C-2GA3AG1TC6CT11TC8AG71GA6GA6ACAG14GA23GA14TA53CA13AG4AGGT10AG28AG2TCGAAC1AT5AG40TA2AC1CG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA1CT2AG20CTTACG9CA4CAAT21GAAGAC6GA2AG9AGGAGA1AT12GA7TG1CACA20GAGA6TC16AG30CA19ATATG-G-A-G-A-C-4GA1GT1TC5C-T-C-3TC2GA2AG7GA1T-A-G-T-G-C-T-A-C-T-A-T-C-A-4AG2TG2T-5TC2TA5AC4AC3TC1AG5GAGA12TA8GA33AGAT11CA4TC6CT18GATC12CT4AG2CAGC2CT1GA1AT18TG9AT76GA27GA8-A-G-T1AGCG1TA1GA6CT46GC3GA24TA21AG20AG66GA24GA45CT9AG14AG26AC1AG9AC1TC1TC18AC9GA20TC2AT5CA13GA14AG6AC21CA25GA10CT18AT14AG32AG37CT14CT4TC5CT4GA1TC29CA4GA31GAGT2CG14TC3AG6TA6TA3CT57GA40TC8CTGT6GA9AG8CT23CT11CT45AG2TG5AG18TG3TC7CG25GACT22AG13AGGTCG1AGTA11GA20AC5G-A-G-C-C-A-G-C-A-G-C-A-15GA30GA3CT24CG2AG37AG25GC33AG2GA61CA2AG9GT15GA4TC2TC8TC1TA11GA1GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,663,9,671,9077,9719,0.0,789,91.855,609,plus,3TG2CGTA22CA2AG9GT15GA4TC2TC8TC1TA11GA1GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA133 -OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9719,509,9178,9686,1,489,3.68e-161,566,89.194,454,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 +MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9718,9070,480,9481,576,9624,0.0,10871,92.271,8369,plus,26-G-A-C-C-C-T-T2-A-G-T-C-A-G-T-G-T-G-G-A15C-3A-1ACTC2G-G-C-TA1GA1TGAG2TCAT2GA1TG1CGTACA2TGAG2TA17GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115527.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9481,9718,542,8949,9481,1,540,8.48e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9718,9034,70,9055,648,9620,0.0,10451,90.779,8201,plus,19AG41-A23CG21GA3TA59CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA69GATC9CT2AG12AG1TGGA20CT6CAAG11AG20GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG13CA23GAAG28AG18CT73GA11AG11TG2GA18TG19CG23GA29CT36CA3CA24CT23GA30GATC7TC34GA2TC8TC20GA2TC8GT8TG59CT14AG8AG6TC31GA2GA11CT47CTTA8GACT3AGGA21AG2GA2AT30AG4TC50GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA21GA10AG20AC1ACAG1ACTA6GAAG5AG11AG49AG11AG61GA3CT9TC30AG13AT29CT3CA25CT2TC8AG40GA27CA8GA6AG11GA4AG21AT16GA8TC11GA51CA19AT21CT30GA21AG29TC5CTCG10AG23CT15GA7AGGA94GAGC66AG6CT17AG18GA10CT38TC51CGAT9CA41AG2GA14CT5CT2TC16AG21GA24GA43GA20CA7CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG33AG13TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA6CT19AG4CT1AGCA30CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGAC9AG3AG8CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC1CA26CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC32TA77TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA25AGGACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT24GA23CT15TC2AG21GA2GT9CT5CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG10GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA20CT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CTCA7GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2ACAC5CT11GC14CT24TC6TA1AC17TA11GA24AC3GT27AG5CA5CACA-T1GTGC2GC1AC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT4AGAT14CAAT29GA53GA3CT18CG6TG9A-G-2TG3-A-A-T-G-A2AC6TC3TAAG2AG1-A-G-C-G-G-G-A-G-A-A-T-G4CT3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT4GA7GA2GA2TC8GA1AT4G-T-G-G-A-A-A-T-A-4GCGA2A-A-A-4GA1AT3TC2AG24AG12AG27TA30GA4GAATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC1CT5AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG19TGAT1GAGC2CT2AGCA1TA6GAGA4AG8GA15GA1GAAGAC1GA1TA6GA11ACA-6TC2TGAC7AG4AC6-G-A-A1GT12GA7TG23GA2AT2GA1TC3TC36AT7GA18-T-T-T3GA5-T-G2TGAT1TC2G-2TG3-C-A-A-A-T-A-A-C6TGCG2AG1AG4TA5AC30TA8GA9GA12TC9CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CTAC5GA59CA18AG11CA1TG20AG2GA18CA1TA8CG44GC3GA52AG14AG66GA8CG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8GT1CG7AC1AGGA6GA11GAAG1ATCT4TC1TCATAC10CGTA3AG2GA5AG6CA13CA7CA9GA16GA7GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11CG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT10GA1CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA10TA5GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG3TG5AG5GT3GCACAGCG1CG8AG2GACG16TC18AG22AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 +MK114997.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9055,9718,537,8519,9055,1,536,6.00e-175,612,89.944,483,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG3TG11GT3GCACAGCG1CG8AG2GACG16TC41AG2TC6GA10CTTC3AC2TG31G-23AT22GC21CT93 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,9022,565,9537,623,9624,0.0,10905,92.596,8354,plus,26A-C-T-C-TG4T-13TGAG20GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,542,9005,9537,1,540,6.18e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115518.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9537,9718,28,370,397,622,649,0.002,42.5,100.000,28,plus,28 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,8983,200,9165,768,9675,0.0,10441,90.927,8168,plus,51CG12AC14TCAGCGCT27GA48CT2CT14GATA13CT2GA5TA18GT50GATC9CT2AG4CA7AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC20AGCG2TA35AG28AG18CT73GA11AG10CATG2GA18TG19CG23GA29CT36CA25TA2CT23GA30GATC7TC34GA2TC29GA2TC8GT8TG44TC14CT14AG8AG6TC31GA2GA11CT41AT5CTTA8GA5GA24GA2AT30AG10AG44GA57TC9CT25CT26GA4CA14TC5AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG5AG11AG49AG11AG65CT9TC30AG13AT29CT3CA25CT2TC8AG40GA36GA6AG11GA4AG21AT16GA8TC63CA19AT21CT52AG29TC5CTAG10AG23CT15GA7AGGA94GAGC55TC10AG6CT17AG18GA10CT38TC51CGAT9CA15AG25AG2GA14CT2AG2CT2TC16AG21GA24GA43GA28CTAG33GA14GCGA2AG51GA13CT30GA24GA2CATC4GACG36AG2TC22TCGA44AG5CT17AG47TC23TC2AG23GA8GTGA1CT14GA6TA6TCGT16GA12CA2TA3CT19AG4CT1AGCA12GA17CA5GA21AC1GA19GA16CT17AG1TC2CT11CA51AGGC9AG12CT1GA23AT8AG86GA6TC11CG1TC41GA24AG34CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG9AG18AG2GA17TA14TC110TC54AG35CT14TA41GA1AT71TC33CA74CA21CT2AG5AGAG7CAAG1AG5GT4CT19AC1AC6AG2CT22TC7AT2AT13AC45CT8AC19GA26GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6TC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA14AG9TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG14GA19CTCT12TC4CT2TC19AG9GA5ACAG3TC40CATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC49TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT11GC13GACT24TC6TA1AC17TA11GA24AC3GT27AG5CA2GA2CACA-T1GTGC2GC1GC2AG1C-A-1CG1CGTA1-G-G-G-G14TC1TA2TC11GT7AC8CT1-C-A-G1CA2CA32AG5AG8TC38GT6AGATGA14AC2CA25GA6GA7CT5AT14CAAT29GA53GA3CT18CG6TG9A-A-2TG2AGT-C-T-A-3CGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-3TG5A-T-A-A-C-3AG8AG21GA3CG4GA1AC7AG2GA4ACCAAG6CT5CT4CT12GA2GA11GA1AT1G-T-A-G-T-G-G-A-A-7GCGA2A-A-A-4GA1AT3TC2AG24AG40TA30GA5ATGA6ACAG15GCAC5GC61CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG12GA6TGAT1GAGC2CT2AGCA1TA7GA4AG8GA15GA1GAAGAC1GA1TA6GA18TC2TGAC7AG4AC6-G-A-A1GT12GA6CATG23GA2AT2GA1TC3TC36AT7GA18ATAT14A-T-G-7CAAGAGTG1GCGA3GAGATC6TGCG2AG1AGGA3TA5AC30TA8GA9GA22CAAGAT2GA35GACT2GATC12GTA-G-C-A-A-C-5TC1GATC5TGAT1AC4CT6GA59CA18AG11CA1TG20AG2GA12AG1AG3CA1TA8CG44GC3GA52AG14AG66GA8TG71AGAC6CT6AGTC9C-C-C-1A-G-A-T-G-G-4GA6AG2TAGC9CA1AC3TC8AT1CG7AC1AGGA6GA11GAAG1AT5TC1TCATAC1CT8CG4AG2GA5AG6CA13CA7CA9GA24GA4TA3CA1GT5AG12AT26AG20AG2AG4GT29CT8GA2AG2GT7TA11AC27AC7GA20GA2CG5CTGTAC8CA1TC4TC3AG5CT11CT13TG9TC31CTGAGA40AC2GC2GA17GA18AC13AT14CTAG7AC27AG11TG5AG3GCCT1TG11TG11CG1CA16AG6GACT17AGAG5TG5GA1GA1GTCATGCTAGGT1GACT12CTAG7GA15A-G-G-C-C-A-G-T-A-A-G-A-G-A-G-C-C-A-13CA1GA30GA10CA1TC31AC1GTTG6CG2GA9CG8G-A-A-19GC18GA16GC4CG5AC34TA9TC5AC13CT15CA5AC22CT26AG7TA7TAGCTC13TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1AT2AG9AG5GT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,592,8574,9165,1,591,0.0,690,90.878,538,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA24AGGA6TA7TAGCTC13TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1AT2AG15GT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTC3AC2TG31G-23AT22GC21CT105ATTC41 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,129,1,128,778,650,1.18e-41,169,96.124,124,minus,19AT3CT21GC23-T41TC17 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,72,130,201,623,694,1.90e-21,102,98.611,71,plus,44AG27 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,48,9167,9214,463,510,5.46e-12,71.1,100.000,48,plus,48 +MK115065.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9214,9718,48,9167,9214,9547,9594,5.46e-12,71.1,100.000,48,plus,48 +MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9718,9067,648,9663,640,9642,0.0,10107,89.324,8099,plus,27TGAGGA62AG22-A-A-A13AG20AGAG13TA24ACAG27AG10GA57CT2CT5TG9AT7AC4AG11AG6GA13CA29TA31AC1GA2AG6GA2CA16CT5AC8AG26GA8GA4TC8AC4ACGATC1CG2GACT20GT12CA31GA19AG3GA20CT2TC8GA2AG23GA95GA10AGAG30GA75CG2AG8GA27CT20AG11GA30TC9AG49GATCCT17AT8TG10AG15AG2AG11AG32AGAG7AG2AT35GA17AG42AGAC2TC41CT28AG6TC100AG18CA3AG9AG4CT52TC1AG3ATGA6GA7TC18GA1GA5AG3GC11GA9AGAG40AG5GA35CT17AG16AG17AGAG11CT30ACCTTC68CA6TC14AG4TC20TC8AG12CA7AG8AG3AG67AG8AG3AGAGAG2GA12AG61AG19AGGA11AG16AGAG12AG10CT6AG13GA6AG10AG5AG18AG11AG9AG33TC3AG9AG35AG4AG30TC24GA32AG5CT9AG17AG25AG11CTTC6AG2AG1AG2TC1GT11TC20CT8GT5AGAG52CA5TC27CT4AGAG1AG11AG14TCGC3AG9GA2AG19AG4GA7GA11GA4AC38AG3AG22AG36GATA11AG10GA50GA10CT3AG3AG64GA5AG8CT4GA9AG8GA2AG7AGAG2TA2CA1AG9AG16AG6CT4AGAG8CT25AG6AG5AG5GA2TC2TA14TC12AG10TC1AGAG12AG21GACT14GA6TA31AGCT1GA10GA6AT11AG39CT2AG4AC18AC1GA12AT46CT2TG4AG16AG5AG2AG32AG13CA12AG19AT2GA3AG12AG5AGAG45AG13TC11CT9AGAG8CT4AG20AG11TC34AG21AG31GA8AG11CT2CT2CT17GA1AG6GA3GA10AT8AC1CG10AG12AG11AG2AG3AGAGAGGA13GT3CA25AG45AG35CA93CA19GA46AG4GA25AG2TC2TC79AG61CA32CTAG5AGAG6CTCAAGAG28AGTC35GA34AG33AG5AG19AG1GA3GA2AG16AGCA6CA20CT8TC5TC6GT4AC12GA5AT10TC1GT6TC47GA12AG8GA15CT21GT2AG51AG7AC22CT5AG10GAAT25CTAT5TC11AG22AG10AG7AG1GA4TA31TC12AG4CT1AG16AG1CT24AG18TC34GA3CG10AT14AG2CT25CT8GC46CG3CA3AGGA18TCATCT5CT9GA7TC11TC2TA2TCACTA3TG2AG23GACT4TA15AG1GT8CA12AG11AG6GA1GA6TC15AC7TA1AGGA32TACAAT1GT-C2GC1GC2AG1CGAGGACG2TGTG-G-G2AG5AG5TC10AG1AG13AG4AG2GA4CACA1GA1GT19AGAG14GAAG7AC37AGGA8CT11AG43AG5AT1AG1AT6AG6GA16GA3AG10TA28AG9TC14GA3CT18CG6TG2TC6AT1TG1GA4AGGA3CTGATA3TCTACA2AG2CG2CGTCTGCGTG1-G-A2AGCA2CA1TG-G2-A-A-A5AG2GA1CA7AT12CG11AGGA1AG4AG1AGAC1AG6GTCAGT3CT11AC5TA2GA2GCAC7G-A-2AT2A-A-A-A-T-A-A-C-A-G-2GC6AC4GA5TC2AG14CT9AG5CT15AG18TA13AG7AG8GA13AC5GA5AC27GA12AG6AG55AG1GA10AT4AT4AG6AG6AC13TC4ACGAAC1GT1CTAG2CGGA4TATACT4TC27TA2ACACAG3-C-C-A-G-A-G1AG7AG9TGAT5CT4GA1T-A-T-4AG2GA1CT2AG2GA21GA1-A-G-C3TA4GA23CGACCA5GA2AG5CT-T2AG1TACAAT2CT1CA3A-12TGTCCA4GT5AGAG9GA8AG18AGAG1AG4CT5TC9TA2TCCA15CT1AG1ATCT3AT1A-T-G-5GTAGTG3TAGC-T1CA1-G-G3TA3GA1TC3CG1GAAGAGTA3AG1TC-A-C-A5AC4AC25CA8GA5AG29AG9AGCA3AT19AGGC1TA12AG1GTAG1GT3-A1AC3TA1-T-G-A-G-T-C-C-G3CT3TC9AG3AG1AG6AG3TC12AG24GA13AG2AG19AG20GA11AGAG2CA8AT8AGAG6AG8CAAG10AG8GC2GA2AGGA9AT11GA1GT1CA17AG20AG21TC18AGAG5TC18GA10AG12CA16AG2AGCA4AG9AG20AG9AG4CGGC6AGGA3G-G-C-4C-A-A-A-A-2TCA-C-A-A-A-A-G-3AG2TAGC1CG4AG1GA2AC3TC5AG3AG4AG3AC1AG7GA20TC2AT8AGCA6AG2TATACA3AG3AG24CA11AG11AG5AG4GA5TA2CA1AT18AT25AG3AG39AG9AG5CT11AG10TA7GA7AG3GC14AG3TCAC6AGGA4AG12AG2GA7GAGT17TC3AG10AG9AG8AG26CA17GA1TCCG1AG15AGAG6AG1AG3AGAG16AG2AG9GA5CT1AG27CT11CTAG7TC4TC9AGAG9AG1AG1AT6AG2TG5AG2AGTC1AT8TA3TG12GA17AG4AG1GACT13AG24AGAT1GA2AGAG2AG1ACAC1GA1AT2GA1AGAG8AG2A-C-G-A-G-C-T-C-A-G-C-C-A-A-C-A-G-C-A-G-A-T-A-A-A-G-A-23AG3AGAG11AC7AG6TC8CA1TC7AGGC14TC7AC24AG6G-A-T-5AG13GC7TG13CA8TC2AG6CG7GT39GA2TC9AG3GA41TC33AG2AG10CA19TA13CG11CA2GA14GA12AC4CT11CG6AT4AG18AG7CT3TA6AG14CA12AG11ACAT11TA2AT3AGGA11AC6TG1CT2CA11AG-C-T-G-G-G2-C-T-T-T-C-C1-G-G12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 +MK115464.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9663,9718,558,9120,9663,1,558,4.74e-171,599,87.993,491,plus,11GA2TC8ACAG3GA41TC10GA22AG13CA19TA13CG10TGCA2GT7GA5TCGA12AC4CT11CG6AT4AG1GA16AG7CT3TA6AG14CA24ACAT11TA2AT3AGGA11AC6TG1CT2CA11-G-C-T-G-GAG2-C-T-T-T-C-C-A-GAG12AG3AG4CT1AGAG19GC7AT10-T13AG9AG20AG11TG7AG44TC8 +MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9718,9070,541,9544,577,9624,0.0,10845,92.161,8359,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG1AC2A-2GA1TG1CGCATA1CGTGCGCA2TC1TACG2CG10GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115530.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9544,9718,542,9012,9544,1,540,3.24e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,8889,661,9500,755,9625,0.0,10721,92.496,8222,plus,3CACA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC6AG12TC1TA2AG6TC1CA52AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG2AG14AG81A-T-G-G-G-21AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC1GT6TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT8CT37AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT67GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC7AG4AG17CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT19AG6AG12GA35GA22GA52GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT32TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC1TC4TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-A-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC10AC39AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA7GA6AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,544,8966,9500,1,541,1.71e-174,610,89.890,489,plus,14TC8ACAG18CT6GA5AC10AC13GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA7GA6AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT83T-5 +MK115520.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9589,9718,99,9492,9589,4443,4345,9.70e-29,126,94.949,94,minus,4GT7GA36AG20CT9-A18 +MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9718,9087,581,9617,577,9626,0.0,10878,92.253,8383,plus,26-A1TC2ATGTCT3GCGACGGTCGCTCG3C-A-G-21G-G-A-C-T-C-T-G-G-T-3T-2AG2T-3C-A-C-TG3TG1T-A-1CA1GATG2CAGACA1GC7A-8GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115503.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9617,9718,544,9083,9617,1,542,1.19e-179,628,90.809,494,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT89 +MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9718,9068,479,9485,577,9624,0.0,10905,92.402,8379,plus,25A-C-TG1ACACTCCT1CT3-T5CT1C-C-C-3CA1G-G-G-AT40TGAG20GA29AG20-A-C-T-G-G-T-G-A-G-T-A2ACAC4TA24GA23AG14AG8GCAG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2GT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA24GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA29TC5TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTTA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA13GT4AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 +MK115570.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9485,9718,542,8953,9485,1,540,6.15e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC16AT22GC18GT2CT8ACGT87 +MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9718,9071,349,9353,577,9624,0.0,10887,92.316,8374,plus,25-G-A4-T-T-T-A-G-T-C-A-G-T-G-T-G-G-A27A-C-T-C-T-G-1TG2TCAT2G-1TACG1CGTACA1AGAGTGCA19GA29AG35G-A-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT10AG25GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT7CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA25AT9GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA5AG23GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AG19GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115509.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9353,9718,542,8821,9353,1,540,8.37e-179,625,90.775,492,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AG13GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,8942,204,9098,747,9607,0.0,10391,90.930,8131,plus,2GT2TG1AC15TC48CG2CA8CTACAG27AG4GA4CAGA45CA8CT2CT29CT1AG7AC7AG2CA6GT50GATC12AG5GA8TGGA4GA2TC5AG14AG32GAAG14G-C-C-12AC3AG2GACT2AG17CT14GC5AG26CT5CTCT20AG13AT14AG18CT7GA92GA32GT5AG3GA16AG2GA55CG10CA10CTGA16CT18TC5CT16GA12GATC7TC58GA11TC17AG6GAGA51CT22GCAG38GA9AG13GA8AT16CT4GAGA1GT2CGAC1GA27AG14CT9CT23TC1TC29GA42CT2CT29AG12CT13GA8CT35G-G-A-G-A-G-C-C-T-C-A-G-G-C-C-A-A-C-A-G-C-C-C-C-A-C-C-A-G-T-14TC5AT7GA2GA1CT3TCTC12AG4GT9GAAC3CA3CT3GA9AGAG19ACGC1AC24AC19CT33GACGGT75GCCT9TC14AT2TA32TC17AG38TC8AG14GA27AG58AG14AG14AT27AG31GA80TC5AG18AG25CA26AC32CT81TA16AC29AC23CT56AG2AG3GCGA11AG6GATC28GA43GA19AGAT9GA5AC1TG33AG8CT23AG10AGAG20GA12TC58AG39AT7AC23AG11GA56GA53GA6TA1TC44AG25TC12CG40GA3TC6CT4AG66TG4TC30AG5GA1CT14GA13AC9CA5AG5AT15CTTA6AT11AG10CT9GA45AC21GA34AG4CT3AG16TC20GA21AG4GA2TC9TC21GA9AT2GA7GA36CT68TC12AG25GA14CT12AG82CT3AC1CT41AT21AG2AG1CT2AG4AG21GAGA16TA17GA11GA32AT11CA50TC59TC45TA13CT27GA28TC20GA11GA41AG17CA60CA30AGAG4AG3AG27GA3AC9AG37GAAGGA6GA17TC4GTCA4GA5GA38AG3GAGA9AC5CA2GA6AG1CA24CT10TC11AC12CA1TG3AT10TC1GT54GA22GT1GA37TG5AG53TC28AG2AG6CA1GT11GA12CACTAT5TC3AG11TC34GA20GT20TC19AG16AG3TCCT1CG22TG13AGCA35GA10AC25CT21CT1CAGC5GC35GA1AC5GA2TG3TA1AC1AGGAGA1CA5GA9ACCT33TCTA1TC2TA1A-G-A-1GCTC13AGCT16GAGT22AT8CA1TC40AG1AT2CA8AC3GT33G-G-G-G-G-A-T-C-3A-4TA1GA5GA14-G-G-T1CG1CG1ATTG1CGTG18AG2AG5TCAT3AG10CA34AG5AG8AC11CT90AG1GA5AGAG46TA2AG5AT5CT3GA4CT52CGCT5TG6AG5A-C-C-A-T-T-G-A-G-C-C-A-2CG4CA6ATGA6TG4-A-G-C5-A-A-T1TA2GAAT2GA9AG2GA1CA16GA3CG7CA6AG4AGGT1AC14CT1CT15GA2GA2GC3CT2GA1GA1ATAG3AC2AC5TA2GA5TC9TC7ATGC26AC5AG47GA6GA4AG1AC16ACAC5ACCA10TC82GA9CT7TA1AG6AG4GA22AC1AT6TA33-A-A-AGA4-T-C-C4AC2TG1TG2CG16TGAT1GA3CT4G-A-T-1TA7GA4AG3AC21AG2AC1GA1TA7CA9CA3GA1GA4AGAC6CAAG11-G-A-A1GT3GACA7GAAT6AG1CA29TC40AT4GAGC4AG3TACA1TA1GT1-CAT2CG1ATCT2CT1AGAT3-T-G1TATG4T-G-3TG1CG1A-6GA2AC1AG1TA3-A-G-T-G-A-C2CA4TCAC8TC29AGGA1GA29TCCA19GA14AG23GT1CA2A-C-1GCGA3GAGT2A-C-A-G-1ATACTC4CT15GA3AG6AG30CT9GA5AG65AGCGCA9AT14CT4GA26AC3CA46AG12CT10GT11GA32AC2AG15GA16GA7GAAG26CT17CT9AG14AGTC14GA1AT5AG1TAAC1CG6GA1CTAC1TCTATC3TC6CG7TC1CG20AG1ATAT4TC2CTACAC3CA4GA3GT4GA8GA43AG16GA5TA4CT11CT6AT8TA1AG14AGAG20AG37CT22GA1TC5GATC67GAATCTAC15TC4AG12TA7AC94AC18GC4GA2AG41AC16TC22AG8TG3CT4AG2AGTC9-T-A-T-T-C-G-C-C-A-C-A-T-A-C-C-T-A-G-A18AG5CA33CAAG4AGAT2GT2AG4GC2GAAC16GACG2AG1AG5GC11GA12TC9TC7GA31AG3AC15TC43AC9GA5GA11CT7GC4TG44TC5TC1TC7AG9CT15GA5AC49AGAGCT5TACT6TAGC14TA18TG9GA1GA5AG19AC16AG19GT3AC1CG8GA6AGTA5AG30AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT22AG1G-G-G-A-G-G-C-G-T-G-A-C-11-T22GC21CT3TC5GT47GA6GA15 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,535,8565,9098,1,523,1.26e-164,578,88.037,471,plus,8TC5TC1TC6ACAG9CT15GA5AC24GA24AG1CT5TACT6TAGC14TA18TG5TG3GT1GA11TC13AC16AG13GA5GT3AC1CG8GA6AGTA5AG28GA1AG3AC5ACATAG18GA10CT1AG5TGTC1GA15GT12G-G-G-A-G-G-C-G-T-G-A-C-10AG12-T22GC21CT3TC5GT47GA6GA15 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,161,1,161,4772,4612,1.47e-54,212,95.652,154,minus,48GT11TA32CT11CT17AT16CTCT19 +MK115702.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9098,9718,51,160,210,649,699,2.00e-12,72.5,98.039,50,plus,18AG32 +MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9718,9114,49,9137,649,9680,0.0,9883,88.227,8041,plus,18AG41-A23CG9AG11GA3TA11AG20AG26CG12AC3AG10TCAGCGCT11AG15GA48CT2CT12AG1GATA13CT2GA5TA2AG15GT44AG5GATC12AG7AG4AG1TGGA13AG6CT7AG32GA5AG21A-A-2G-6C-A-G-CT33CA1AC2AG8AG8AGCG27AG10AG28AG18CT50AG1AGAG19GA11AG11TG13AGAG6TG19CG22AGGA8AGAG19CT24AG3AG36CT10AG10AG1GA16AG13GATC7TC14AG18AGGA2TC28AGGA2TC2AG5GT8TG10AG18AG14TC14CT14AGAG7AG6TC46CT41GT5CTTA8GA4AGGA10AT1AG14AT30AG10AG17AG6AG7AG13AG26AG20AG7TC9CT14AGAG9CT26GA4CA14TC1AGAG2AT4GA5GA20AC3ATGA3CA17GA10AG20AC1ACAG1ACTA7AG3AG1AGAG10AG39AG7AG1AG11AG2AG12AG4AGAG6AG32GA3CT4AG4TC3AG14AG11AG2AG10AT12AG16CT3CA2AG22CT2TC8AG29AG3AG43GA6AG11GA4AG2AG5AG3AG8AT8AG5AG1GA8TC11GA31AG19CA13AG5AT8TC1AGAGAG8CT2AG49AG5AG23TC5CTAG10AG23CT15GA5AG1AGGA28AGAG3AG61GC31AG15AG18AG6CT14AG2AG17AG1AG2AGAGAG4CT38TC4AG3AGAG17AG23CGAT9CA10AG27AGAG1AG2GA2AG4AG6CT5CT2TC4AG11AG22AG23GA42AGGA24AG3CTAG33GA13AGGCGA2AG24GAAG23AGAGGA13CT3AG26GA24GA2CATC4GACG11AG1AG22AG2TC8AG7AGAG4TCGA1AG2AG23AG11AG3AG5CT17AG7AG28AG10TC12AG10TC2AG12AG8AG1GA8GTGA1CT3AG17TA6TCAT16GA4AG7CA6CT19AG4CT1AGCA12GA17CA3AGAGGA21AC1GA19GA16CT10AG5AGAG1TC2CT7AGAG2CA12AG5AG2AG29AGGC1AG7AG12CT5AG10AG8AT8AG16AGAG68GA6TC5AG5CG1TC60AG5AG7AG21AG4CT18GC28CT3AC1CT8GA22TC9AT21AG1CTAG4AG4AG11AG2AG3AGAG1GA9AG5AG1TA14TC32TA28AG48TC18AG24AG10AG35CT14TA18AG22GA1AT31AG39TC33CA52AG21CA21CT2AG5AGAG7CAAG1AG4AGGT4CT9CT9AC1AC6AG2CT22TC2AG4AT2AT5AG7AC8AGAG32AG2CT8AC46GACA2GA17CT8TC5TC11AC11GA2TG3AT10TC1GT6GC17GA23CT15TC2AG21GA2GT15CT8AG3TC1AG8CT12TC6GA6AG7AG1AG7TC14TC7CT5AG2AG7GA12GA11AGCACTAT5TC3AG7AG3TC19AG13AGGA2AG16CTCT12TC4CT2TC12AG6AG9GA3AG1ACAG3TC22AG16AGCATC13AG14AG4TAGA10AC16CAGA24CT4CT2GC5GC13CT35TCCA3CG1GA8AC9GTGT5CT2GA11TG13TAGC1CTTA2GCAC5CT10AGGC13GACT20AG3TC6TA1AC10AG6TA10AGGA24AC3GT27AG5C-G-3A-C-C-A-G-G-A-4TA8AC4AG5AG-G-G-G-G-T-G-G-A-G-A-T-G5TC1TA2TC5AG4AGGT7AC8CT1-C-A-G1CA2CA4AG17AG9AG5AG8TC36AG1GT6AGATGA14AC2CA25GA6GA7CT3AG1AT14CAAT29GA28AGAG23GA3CT18CG6TG9G-A-A-2AG2TGC-T-A-3TGGACTCA4CT1ACTC4CG1TA4TCAGAGTG1AGT-A-C-T-2ATTG5A-T-G-A-C-3AGGA7AG21GA3CG4GA1AC7AG7ACCAAG6CT5CT4CT12GA2GA11G-2AT1T-A-G-T-G-G-A-A-7ACGA2A-A-A-4GA1AT3TC2AG24AG40TA13AG16GA5ATGA6ACAG6AG8GCAC5GC28AG32CT1GA2CT21AG15CT4CT2TA2AG31TC1AC7AG25TC10GA2-G-A-A-T-C-C4AC2CG1TG7AG4GA6TGAT2GC2CT2AGCA1TA7GA4AG8GA17GAAGAC1GA1TA1AG4GA18TC2TGAC7AG4AC5-G-G-A2GT12GA7TG12AGAG9GA2AT2GA1TC3TC12AG3AGAG18AT7GA16AG1ATAT5AG5AG2A-T-G-7TAAGAGTG1ACGA4GATC6TGCG2AG1AGGA3TA5AC30TA8GA5AG3GA22CAAGAT2GA35GACT2GATC7AG2AGA-G-A-1CTA-A-C-5TC1GATC5TGAT1ACAG3CT6GA3AG2AG12AG8AG30CA15AG2AG11CA1TG22AG13AG1AG3CA1TAAG7CG6AGAG6AG20AG8GC3GA52AG14AG40AGAG24GA8TG1AG14AG15AGAG6AG9AG20AGAC6CT1AGAG4TC5AG3C-C-C-1A-G-A-T-A-G-4GA6AG2TAAC6AG2CA1AC3TC5AG2AT1CG3AG3AC1AG7GA7TC3GAAG1ATCT4TC1TCATAC10CG4AG2GA5AG6CA13CA5AG1CA9GA1AG11AG5AG4GA4TA3CA1GT5AG1AG10AT17AG8AG2AG17AG2AG4GT24AG4CT8GA2AG2GT7TA11AC22AG4AC7GA4AG6AG8GA2CG5CTGTAC8CA1TCAG3TC3AG5CT4AG6CT13TG9TC32GAGA10AG8AGAG7AGAGAG2AGAG5AC2GC2GA7AG9GA7AG10AC13AT14CTAG7AC14AGAG9AG1AG11TG5AG3GCCT1TG11TG11CG1CA16AG4AGAGGACT13AG3AGAG5TG5GA3GTCATGCTAGGT1GACT1AG8GA1CTAG3AGAG13AG4A-G-G-C-C-A-G-T-A-A-G-A-A-A-G-C-C-A-12AGCA2AG3AGAG19AG4GA10CA1TC31AC1GTTG6CG12CG4AG2AGA-A-A-5AG13GC18GA14AG1GC4CG5AC34TA9TC5AC13CT15CA5AC22CT18AG7AG7TA7TAGCTC3AG9TA18TG9GA12GA1GATA11AC1TA8ACGA3CT1ATAG1AG7AG1AG2AG2AT3GCACAGCG1CG8AG2GACG61TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 +MK115095.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9137,9718,597,8541,9137,1,596,0.0,658,88.610,529,plus,4TA9TC5AC2AC10CT15CA5AC22CT1GA16AG7AGGA6TA7TAGCTC3AG9TA18TG5TG3GT7GA4GATCGATA11AC1TA8ACGA3CT1ATAG1AG7AG4AG2AT3GCACAGCG1CG8AG2GACG35GA25TC1AT4GA10CTTCAG2AC2TG3TC2AG13AG11A-13AG3AG4AT22GC21CT10AG30AG20AG42ATTC46 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,9026,371,9347,622,9624,0.0,10828,92.311,8332,plus,27AGAGAGTA1T-2A-1CA1G-T-G-G-CA2CGCAGA1AGCGAG2TA1T-3C-3GA9GA29AG35G-A-A-4TA24GA23AG14AG8TCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG34TC64CG39CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C8TC2ACTCGA10AG14AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG5GA5GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA18CA4GA29AG5CT50CT3CT14GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC1AT54GA16CT3AC16AC35AG4GA2AG15TA8CA35TC11AC14TG3AT10TC7AGTC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC13GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACT6TGCT59GT5AT21TC12AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TCAGAG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG4GAAGAC6AGAG4AG7GA9CT17GA2GA11GA6AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC2GA32AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT3GA-A-A-T20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T1GA1AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG5AG42GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT14TC6CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA23AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT13GA4GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,542,8815,9347,1,540,3.18e-176,616,90.221,489,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GAGA4GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-10TC16G-6TC39GC18GT2CT8ACGT87 +MK115490.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9347,9718,28,91,118,622,649,0.002,42.5,100.000,28,plus,28 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,9047,269,9266,600,9624,0.0,10873,92.384,8358,plus,5TC2GTGT2AGCTTC2AT1ATTGCGCA23C-TA1TA2TG1AC2A-2G-1TACG1CGTACA2TG4T-C-T-1TC2C-13GA29AG35G-A-A-4TA24GA23AG14AG8GCCG44GA10TA31TC2CA5CT23GA2AC58AG8TA4GA8GATC12AG12CG2GA2CA22GC3GA31GA8A-G-T-15-ATG7GC2AT3-G-T15CT12CA23CG2CA43AG5CT14CG86TC17AG33TG99CG5CT33CT18TC22GA17TC8TC4AG47GA4TC7TC57TG4TC29AG8AG2AT8GA20AG5GA2GA5AC8AG32-A-A-C11ACTCGA25AG49TC5AG54TC11CT5AT26AG12CT4AG14CT2CT49TC5AT8TC7TC16AG1GT18CT2GATA9AGAG13GA13GC19TC1TA2AG6TC54AG65CT18CT21AG47CA7TC2CT17TC8AG101AG14AG50TC53CT20TC29TC60AG11AG4AC34CT3TC20GA3GC13GT71GA11TC80AG17AG83GA18AG1AG50AG5AG21GC37GA20GA3GA43GA2AG3TC3GA52GA13CGAC1TA2AC2GA107AG5GA3GA28AG13GA3AG2TC8AG11GA9GA7CT35CT32AG32TC23TC2AG2AG11CA14CT3GA1CT14GA3AG2TA7GT14AG46CT31AG29AC1GA23GA29AG5CT50CT3CT8AG5GA6GA10CT25AT2CA36GA10TCAC1AG2CA46AT9GA20TC36CT7GA65GA20CT5CTCT1GA3CT7GA26AT21AG2AGAC1GATC5AG18AG2GA17CA38CT122TC23TC15CA19GA51GA28TC44TC17GA11AG17CA60CA21CT8AGAG4AG3AGAG30AC56GA16CT3AC16AC35AG4GA2AG15TA6AG1CA35TC11AC14TG3AT10TC8TC38CA21AGAC8CT9GA1GAAG1GT12AG10GC25GA3AC30TC14TC16AG14GT18CACTGT17AG26CT6AG10GA13CTCT20TC9CA26AG2GATCGT1CG55CT21CG7TC2CT46AC56CA3AGGAGA10GC6AC25TC14CA1GA1ACCA4CT11GC4AG8GACT22AT7GATA1AC28AG2GAGA21AC3GT36GA2TACAATGAGTAC2AC1-C4CG-G2CA-T1CGTGTGAG23GT41GC23AG5AG7AC21GA15AGCACTCA6CT59GT5AT34AG26GA6AG53CG6TG6AG2CT1-G-A-A5TA15CT5TC1AG1-A2GAGT2AT1G-4CA1GA3AG1-G-A-G2GA1GA20CG5AGAC6AGAG4AG7GA9CT17GA2GA18AC3AC2TC4CAAG4TC2AG57TC38GA5GTGA6AC10TA12AC35AG9GA11AG15TC30ATAC9AG25TG5GCGAAC1CT2AG2CG33TGGA5TA4CG1CA1-C-C-A-G-A-G9AG8CTTGAT1GA3CT4G-C-C-1TA7GA4AG18CA8AGAC1GACA9TC12GA3TC1GAAGAC7AG8AT2-G-A-A1GT20TG2CA24AG3TC3TC1CG27TC6AT7GA18-T-T-T13-G-T-A3-A-A2-G-T-C-A3GACATC2CT3TGTG1GAAG2GAAC1ACCA5AC20GA10GT6AGGA31TC2AT3AC29TC1AG6GATC15CT1CGGC1GA1-A-A-T3AT1TC4CT26AG12GA35GA22GA21AG30GT46GC3GA16AG5GA1TAGA20AG5AG14AG17AG48GA23CA12GT6AG44CT30AG1TA9GA2AC3TC18AC21GAAG1ATCT4TC2AT11AG1GAGT4GA8GA29GA41AT11CT29AC3AG29GT7AG51GA30TC18AG17ACGA18TC10TA10CT21CATG2GA33AG36AGTC7CT9GA6GA10TG6GA7GA7AG7AGTC6TC9CA42AG14CA3TG11CG25GACTAT3TC5AG5GT22GT1GAGT10GA23AG16ATGA12TC17GA10GA33AC3CT8GA11AG5CGA-G-T-2AG16GC9GA19TA3AG1GC4CG1CA48TC9AG18CT6GA5AC50AGCT21GA5TC1TA15GT5-A-G-A-T-A-A-G-A-T13CA12AC1TA14AGCT18GT8AG1AG6AG3AGTA5AG28AG11ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,542,8734,9266,1,540,6.01e-178,622,90.590,491,plus,14TC8ACAG18CT6GA5AC24GA26CT21GA5TC1TA15GT5-A-G-A-G-A-A-G-T-T6GA5TCCA12AC1TA14AGCT12GA5GT8AG1AG6AG3AGTA5AG40ACAT14AT3AGGA11TC6TG4A-27G-6TC39GC18GT2CT8ACGT87 +MK115576.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9266,9718,73,220,271,577,649,8.11e-04,44.0,71.233,52,plus,24-A-G-A-C-C-C-T-T-T-T-A-G-T-C-A-G-T-G-T-G-G28 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,9719,18,9686,1,9573,0.0,11704,92.437,8984,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA164-G1TG5GA12TC31AG25CT82GA3AC97CT3AG14GT20TC8TC7GA28AG16TG35GA19CT5GC26CT8GA19A-C-A-C-A-G-G-A-A-A-C-A-G-C-A-G-C-C-A-G-G-T-T-A-G-A-C-8AC6GACT26AG6CA1TC89AG50TC11TC75CG1AG20CT76CG11GA27CT41GA8TC93AT70CT20AG41GA8AC5AG29CA12AGGC1GA16GA11AG12GACT27GA5TC1TC5AG99AG12CT4AG20CT24C-C-A-13TG8TC2TG2AT16TC7AG8AG17T-C-C-7GA9AGAG46GA26GA23CA4AG3AG73CT117TC8AG101AG14AG119GA69TC38AG37CT86TC22AT5CA2GA9AC2GA26AG29AG6GA13AG19AG7TC4TC2CA17AG26GT48AG1CA32AGCT7AG5AG32GA4AG21GA24GA4GA18TC19GA26GA51GC4AC10TA52GACT55GA8GA19AG1TC11GA3AG77CT2CT14AG47TC29AG6ATAT22GA1CT21TA10TC33CT19AG35CT5GA24AC21GA12AG5GA20CT59TC21TC19GT107GA23AG8GA27TC26AG49CT11GA20CT5CT41AT21AG2AGAC8AG21GA17CA203CA5CT6CT15TC40GA28TC26TA126CA30AG9AG23TA7ACAC8AG27GA1AG10CT61GA50CA26CT8TC11AC14TG3AT19TC47GA37GT9CT13AC3GA2AG5AG47TC14TC24GA27AT9AG11TC19AG14GA33TC7TC19AG16AG3TC40GA34GAGA13CA3TC11AG2CT25CT8GC43CA6CA3AGGA11GC6GC1CT5CT32TA2AC5TG14CT11GACT4CA26CA31GA24AC3GT27AG5G-G-G-G-G-A-T-C-3A-4TA10-T-G-T-G-G-A-G-A-T-G-G-G8GT6TC1TA10AG16AG10CAA-A-C-10TC29AG7AC37AGGA66GA5AGAGAT21TC6GA5AG22AG27TC16GA5TC13CG1CT4TG3-A-C-T-G-A-T-T-T-G-A-A-G-A-A-T-G-A-T10CA3GT5TC2AG1-G-A-A-T-G3CA1-G-G1CGCA2TG2AG-A-G2GA15TA3CT1GAAGAC3GAAG8AG4AGAT1-C5G-9CT8GA11GA4CA6GA1GT4AC2ACGC1A-T-A-A-G-A-G-T-A-A-T-A-A-T-A-T-T-A-4T-T-C-2GA3AG1TC6CT11TC8AG71GA6GA6ACAG14GA23GA14TA53CA13AG4AGGT10AG28AG2TCGAAC1AT5AG40TA2AC1CG3-C-C-A-G-A-G19TGAT1GA3CT4GA1C-A-T-7GA1CT2AG20CTTACG9CA4CAAT21GAAGAC6GA2AG9AGGAGA1AT12GA7TG1CACA20GAGA6TC16AG30CA19ATATG-G-A-G-A-C-4GA1GT1TC5C-T-C-3TC2GA2AG7GA1T-A-G-T-G-C-T-A-C-T-A-T-C-A-4AG2TG2T-5TC2TA5AC4AC3TC1AG5GAGA12TA8GA33AGAT11CA4TC6CT18GATC12CT4AG2CAGC2CT1GA1AT18TG9AT76GA27GA8-A-G-T1AGCG1TA1GA6CT46GC3GA24TA21AG20AG66GA24GA45CT9AG14AG26AC1AG9AC1TC1TC18AC9GA20TC2AT5CA13GA14AG6AC21CA25GA10CT18AT14AG32AG37CT14CT4TC5CT4GA1TC28TC5GA31GAGT2CG14TC3AG6TA6TA3CT57GA40TC8CTGT6GA9AG8CT23CT11CT45AG2TG5AG18TG3TC7CG25GACT22AG13AGGTCG1AGTA11GA20AC5G-A-G-C-C-A-G-C-A-G-C-A-15GA30GA3CT24CG2AG37AG25GC33AG2GA61CA2AG9GT15GA4TC2TC8TC1TA13GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,663,9,671,9076,9718,0.0,792,92.006,610,plus,3TG2CGTA22CA2AG9GT15GA4TC2TC8TC1TA13GC1TG21AG30TA4TC10GT12GA14GA10TC1AC1TA14AG6AT12GT44GA7GA32A-C-A-A-G-G-A-C-T-G-C-T-G-A-C-A-T-C-C-AT15AT7TG31G-46GC36AC42GA133 +OQ092466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9686,9718,509,9178,9686,1,489,3.68e-161,566,89.194,454,plus,21CA1ACAG9GT15GA4TC2TC8TC1TA11GA1GC1TG52TA4TC10GT8TG3GT7GA5TCGA10TC1AC1TA14AG6AT6GA5GT44GA7GA4GA27AT4GA11C-C-A-C-A-A-G-A-A-C-T-G-C-T-G-A-C-A-A-7TG31G-46GC36AC31 OQ092463,Ref.B.TH.90.BK132.AY173951,0,9605,8996,8952,688,9605,1,8896,0.0,10987,93.186,8342,plus,4TC12GAAG12AC45-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G6-A-A-A-A48GA15GC16AG1GA10AC24AG36GA2GA20GA2AG9AG17TC3AG13TACG26AG16GA5AGCT12GA14TG26TG14GA20AGAG17GA6G-2A-C-5C-C-A-G-A-C-8CTCT23GA2CT2CG68GA125AG144AC19AG8CT2TC21CT38CT26TC31AG14AG3TGGCTCAT31AC2AG14AG11CT20AG53AT2TC8AG14AG17AG4CA1CT3GC17GA9CT8GA7AT15CT17TC5TCACAG18AG2AG1GA11AG9AG23CT5GA44GA35AG13AC21GA30CA1GAGA13GA9GA2TG6GA74AG23CA4CA63GA54GA35CT4AG5AGAC22CT107CT23GA32TC77GA53AG11GA8AG56GA20TG4TC79AT124TG3TC1AG16AG21CT38AT32GA9TC4AG5GA5TC80AG26GA28GA3AG11GA30CA26AT7CT11GATA61GA8GA17AG23GA3CT23AG37GA2TC16GA12CA47AG23AG20GA5AG2TC17TC14TG2AG38TG38TC11GA23TC32CT66TA4TC1AG12AG9AC7CA5AC26AG63TC25TA2CG5GA20GA68CT3TC7GA17AG29GA11CT44GA54AC30CA32TC9AG8CT5CT32TC38GA20CT35GA22ATCT83AG30CA67CG140GAGA33AG6GA16GT1TG4AGGA9GC1CA2TC26TA2CT11GA2TG2GT1AGAC10CAAG32CA5CT8GA20-G6G-7GA15TA25GT30CT22GA21TA48GA9TG9AG28AG53GA65CT6CA11AG1CA9CT12CAAT5AG2TC17AG7CT36AG10AG18CT1TC2AT2GAGA18AG15TC33GA3TG7CA1TA4TC8GACA1GA28TC2CA5GC50AC3AG3AC41CT10ACCT5GC6CT2CG22AGTG31CA31AG12AT15GT30CT2GA2GA14AG7T-T-G-16CTGCAT13GA8CTTA8AG7AT47TC13AG23GA6GA17TC49GT12GA8CY7AC4GA6TC42CT23CT17GA9AG3A-1AG1TG1A-C-A-C-C-5CT4GA6G-A-A-T-A-C-C-A-C-C-C-C-7AG1T-G-C-T-A-G-T-A-G-2GA5GT1AGTA2GC1GA10AG30CA4AGGA5AT27GA2CT16GA16TC35AC53AG26CTAG12AG4TACAAC10CA13AG21GA9GA11AG3TC26AG22CTTA28TG5GA2TATC12CA5TC6CT6AT7AG5TA3CA15AG2CT2TA2TA1GA9CACA19AG12AC4AG2AGAC2GA19AGCA6TG7GA4GA10G-G-G-2TC5GT6AG7TGCA1CA28CT5AG5AT20AT7AT2TA26GAAGGC3-G-A2TGTACATA2-A-C2AT3T-3TGCA2A-T-G-1CA1CA24GA6AG5CA40TCAG6TACA4AG3TCTA1AC8CT12AT13TA2GT2ACAC1TA4AG2GC4AGCACG2CT2GA2TC10AG14AG19TC38AG10CT54AG50AG1AG22AT34TC77CT1GA38AG26TC42AT7ATCG8GA35GA11AG4GA8TC44AT3TC2GC46GC41CA18GA5GA4GA10CT6AG40CT27AC1AG8GA29GC8CGAC6AG1CT15AT10CT7GA76GA11CGTC6GA17GA33AG10TC5TC5CT23CT3AG21CT1GTGAGT6TA15GC6AC37GA1TC13GTTG4T-2T-T-G-G-A-9AG17CA2GA2GA7ATG-C-A-17GA104-G-G-G12TC7GAGA29TC4CG4GC44TC13GAAC34CT29CT18AG1AC4ATTC32GA14TC23AG2GA6AT21TA12TA5AG15GA1AG4GAAG8TC11TG18CATA21TC8CT52GT75TG12 OQ092463,Ref.B.TH.90.BK132.AY173951,0,9605,8996,576,38,613,8421,8996,0.0,756,95.833,552,plus,11GA11AC34CT29CT18AG6ATTC47TC23AG2GA6AT21TA12TA21GA1AG4GA9TC11TG18CATA30CT45TC6GT89TA98 OQ092465,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9659,8890,8931,654,9563,1,8890,0.0,10476,91.278,8152,plus,18TA2CT13A-32T-TC11GTGAAG42CT32AT9TA1AT47GA26GA26AG16AG10AG19AG8GA2TC17GT5AG6AG17TC23CA30AT13AGCT19CA7TG8CT5GA49TC13AG3AG11AG2GA33TC2CT20GAGC2AC31AG2AG13CG3CT1GA39AG5CT8CT12CT4CT41AC29TC5GA17GA5TCGC16AG5AT11CT5AT5TA7CA16GCGA11AGTC2TC6AG7AG23AC5GA7AC2AC1AC5AG1GA8TC3AGCT7CT9GA6AG5GA2ACTCCTCT25AT6TC6GCCTCT2AG14GA6AGAG12AC2AC2AG5CT1AC6AG5AC2CT2CT5TCAT10AT2AG2AC4CGAGGC2AT4AT6AC3TC3ACGC1ATTG3AC16GA7AG14AT2AG12GATC5CG1CG3GC2C-C-A-12GA1GA1CT2TC2CT1GA1AG9AGGA1CT6GA5CT2CT14GA2TC5TC25GA21AG8CT11TC8GA22AGGA2CT17GA5AC8TC11AG9AT12CA15CT21TC40AG10GA20CACA1CA6AG9GA3GA2AG1TC18CT32GA1CA11GA47GA10CA1GC3CTTCTCGA4AC2CT8TC2AG4TC9TA8AG41AG5TC2CT11TC102GA7CT23GA32TC29AG38AG10GA117AG2CA116TC100GA16AG4TG3TC1AG14GA1AG42TC17GT42TC10AG5TC8TC14GA5GA29CT11GA4AG11GAAG7AG9GA11AG15AGGA33AG39AT19GATA13AG3GT55AG10TC3AG11TA14GA8GA15AG30CT6GA6CT1AG8AG1GA3AG8CA10CT81GA29TC11TG8CT5GA6TATA22AG1TC20CTTC4AG2TG5CA18TC10TC3CT20TG4AG20AC58AG12AG17CA5AC2CTCT73GA2AGGA34TG2TA27GT29GA37CT3TC7GA44AG2GA59TC35GA68TCGA15CATC2AG47AT27GA16AG14CT35GA8AG13AT3AT44GA45TC20CA64TG144GA8AC18AG5AG6AG8AG1GAGAAT3AG7GA11CA2TC1TC1AC6AG15TA20AT5GA3AG3CT3AT87GA9GA11GA9TC8CT56TA5TG32GA27CT2AG39AG34AC3CT53GA23CT8GA8AC2CTAG7GA17AT5AG53TC7TA9GA23CTCATC2AG2GA35TC13GA2TC5AG17TC6TACATA2TC2TC5GACA86GA3AC6CT16CT12GA9GT13ACCT5GCTA5CT27GA21TA7AGCT1CA23AG7AG18TG8GA32GA5TC12T-C-A-G-C-A-2TGG-T-T-5GA8CT29GACT3AG5AC3TC15TC8AG18AT1TC5TCCT21AGAC3TGAT2GATC17GT5TC26CT8AG3GA9GA12GA21GA10AT2GA8GA26TC5AG35GA13AGTG4ACCT3GAGA1GACACGATATTG3AG1CT3AGGA8CG2CGC-A-C-C-C-C-3TA1C-C-A-C-T-G-T-3T-2C-2GA4GT2TA2G-G-G-1A-G-G-6AG18AG5AT5CA2AG2GA25CT7GA2CT4AG11GA5AGCA4-A-C-A-A-G-C4GCGATC6GA24GA15AT7GA21GA17AC13CTAG6CAGA9TA22CT25GA51GA5AG20AGGA12AC12TG6AG2TA17AGTA25AG6CA1AC1GA3CTCTAT4AG6TG1TA11CACA24CT7ACAC6AG3GA6AG1TA9GA1GA1AG1GA2TG3AC3GA3AG11GAGAGA3-C-A-A5GA7TC3TCAG3AT25GA1AGACCT5AG3TC1AG15TC15TA2AC1AG4TA8CA1TA4TG-C-A-G4CA2GA1TGAG-C-A-C6GTGAGA1GA1AT3-A-G1CA1AT2-T5CT1CA24GA12CATG41GC4CGTCCA4AG5CT9CT8AGCT19T-11GAAT1CTAGCT1GCA-C-A-C-T-16TG7AG6AG48AG9AG56TA-C-A-A61AG14GA35GA32GA59GA29GA2AG26TC24GA17ATAC3GAAGCAATCG1GA6GA1TC17AG27AG2TG9CACT12TG27TA10GC4AG4ACAG24GA10GA17AG26GA26GA2TC7CT36TC7AG11CA18AC1AG11GA20GAAG9GAGT1CACG6GAAG1CT14TC7TACA5GA53AG6AG20GA11CGTC6GA5GC34AG10AG4CT11TC5CT17GA18GA2TG6GT1GACTATGT1GT6TA17AC16GA5GA7TA4AG21AT4TCGA3TG3AG3CA2AGACATAG20GA11GA1AT2AG25CT10CT19CT23CT8TC32GA5TC2TC8GA29TC2GA1CG4GT70TG21CA10CA27CACA30TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GAAG8TC5GA7AGTC3AG1GA3CA19CT5GA11CT4CT8AT10GA20 OQ092465,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9659,8890,382,66,447,8509,8890,8.94e-130,462,92.147,352,plus,36TG21CA10CA27CACA30TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GAAG8TC5GA7AGTC3AG1GA3CA19CT5GA11CT4CT8AT10GA20 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,9788,1,9708,1,9719,0.0,11340,90.785,8886,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC7A-32TC6TC5TGAGGA39-A17-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G7T-75CTACAG43CA1GACT28AG5GA5TC11CT17GA2GA17AG2GA2AG5GA2CAGT1TC25AG4CT3TA1CA33AG7GA1GA11AG11GC20GC14GA14CA12AC1TC1AG2GACT35GC5AG15CG2CA35AG7TG11TC8AG12AT37TC87TG1AG11GT9GA4GA9CA1AGCA4GA34AC9GA7CG10CA11GA16CT15CA1TC29CT5CTGATC17AG60TC5GA11TG35GA29GA8AG8AG6TC41AG7AG33GA5CT6GC27AG12CACT1AG13CT11GA5TC1TCTA2TC1AG23GA76GA11CTGA6GA14CT49TC5AT6GA9TC7AG1CA31GA10AG40AG26CT20TA13AG11AG6GA95GA50AG5CT32AG40GA43AGCT15AG14AG5CT36AG16GA5TCGA3AC54TC29TC2TA69AG1GA26AC8CT1CT27CT14GT53TC2GA35TC20AG8GA27GA13AG14AG4AG7TC67CT24TG28TC23AG8CT23AG2CT11GACT16GA23GAGA12CA30GA50TC12CA51AT21GA14AG3AG14AG32GA1TC42TC1AG24GA9TC30AG11CT21CT13GA2AG14GA11TC23TC5AG30GA1CT1AG19CA7GT24CT11CT19AG66AC1GA11AGCT6GA24GA14CT53GA59AT44CT15AG10GA14TC5CT9TC40TA11GA15CT2AG8AG61GA8AG11CT5CT2GA38AT21AG2AGAC1GATC5AG3TC17GA5AG11CA25AG4AG55AT36GA56AG28CT63GA28TC77TC2CT72GA14TC6CT2AG1AT3AG9AG1AGAGTA5GT21ACTC51AG25TA52GA3GA9AC17CA29TC5TC11GC14TG13GATCGA7TC30CA16GA12AG21GA2GT23GC50AG9TC11GA7AG11AG5AG1GA27AT5TC5AC2GA2AG2GA14AT62TC2-T12AG21AG3AC2TG15GA6TG14CA35GA17TC14CT28AC5GC49TCCA3AGGAGA4GC12TC7CT24TC2GA4TA2GCAC5CT13CT11GA2CA22TC6CA44AT2GA1GT6AC3GT15TC5AC14GA2TACA-T1GTGC2GC1AC2AG1CGAGGACG1CTTG-G-G8GT8TA13AG17CT5GA2CA17CT20AG15TC19CT64GA19AGAT15GT5TC12AG20CG23GC10AG31CG6TG6-G-A-T-T-T-G-A-A-G4CA5TA-T-A-C2GA1GA3-G-T-A-G-C-G-G-G-A-G-A-A-T-G-A-T-A3CG1-G1CA2AG3AG21GA3AGTC4AGAC3GA8AGAT10CTGA4CT17GA2GA11GA6GCT-A-C-T-A-A-T-A-G-G-A-C-T-A-A-11GA5TC12TC14AG71GA3GAGAATGA4AGGAAC17TC5GC15CA17CT21TC7GA19GA14AG5ATAC3AT5AG6TC21AG2TCGAAC1AT5TGCA18TC1GA14GA3CA2AC1AG3GC-C-A-G-A-G-A14CA3TGAT1GA3CT4GA1A-A-T-7GA4AG2GAAC7GT4TA1CA1GT1AG2AGGAAG2GA1CA4GA1GA9CA1ACGA8AGAC6CAAGCAAG1GA6CG-G-A-A-A-T-A2GAGA1CA5GACTAC3GA22TA6AGCT2TC5CG30CT2CTAT2TA2GCCAGATC6GACTGA1GT2CT3ATAT1GAGA2CG1GA6CG2AC2CATAAGCGTG1GCGAGAGA3TC1TC2CA3TA1-G-T-G3ACTA5AC4AC16TA9GTAG6GA34AT3GC52CT1GA2AG2C-A-2A-A-A-T-G-G-T-G-G-C-G-A-G-A-A-T-G-G-G-A-C-C-C-A-G-A-T-T-G-G-C-G-A-G-4TA1AT2CG22GA32CT23GA9AG19AG32AGAGCG1TA1CA53GC8AG19TA21AG12CT7AG17AG32AG5TC34GA15AG39AG32AT8AC1AG6GAGAGTAC3TC18GC9GA7TC3GAAG7TC2AT11CG7GA5AG32GA12GA1CT15GA10CT18AT22TC2AG26GA11AG20CT11AG2CT7GA7GA2TC27CTCA2CA33GAGTATTCCG14TC3AG5CT6AGTA3CT8TC4TG14TA26CT1GA37GA26GA38TC5TC5TC1TC3TC3TG7GT5AG9AG9CT1AG5AG2AGTC12CTTCTGAC10CG3GA14AG6GACT23GT9-G-T-A-G-T-G3GTGT6GCTC1GA12AG6GA3AG1T-A-A-G-C-C-A-G-A-A-G-A-13AG2GA7GA15TC4GA3TC4CA3CA18TC6TC7AC2TGAT2TC20AG11CT10GC6AG28GC4CG7CT42TC9AG3GA21GA1TCCT16TCCT9GA25AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,635,1,634,9086,9719,0.0,755,91.811,583,plus,14TC9AG3GA21GA1TCCT16TCCT9GA25AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 -OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9719,637,9075,9710,1,636,0.0,749,91.366,582,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-11 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,9787,1,9708,1,9718,0.0,11355,90.835,8890,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC7A-32TC6TC5TGAGGA39-A17-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T-G-A-G7T-75CTACAG43CA1GACT28AG5GA5TC11CT17GA2GA17AG2GA2AG5GA2CAGT1TC25AG4CT3TA1CA33AG7GA1GA11AG11GC20GC14GA14CA12AC1TC1AG2GACT35GC5AG15CG2CA35AG7TG11TC8AG12AT37TC87TG1AG11GT9GA4GA9CA1AGCA4GA34AC9GA7CG10CA11GA16CT15CA1TC29CT5CTGATC17AG60TC5GA11TG35GA29GA8AG8AG6TC41AG7AG33GA5CT6GC27AG12CACT1AG13CT11GA5TC1TCTA2TC1AG23GA76GA11CTGA6GA14CT49TC5AT6GA9TC7AG1CA31GA10AG40AG26CT20TA13AG11AG6GA95GA50AG5CT32AG40GA43AGCT15AG14AG5CT36AG16GA5TCGA3AC54TC29TC2TA69AG1GA26AC8CT1CT27CT14GT53TC2GA35TC20AG8GA27GA13AG14AG4AG7TC67CT24TG28TC23AG8CT23AG2CT11GACT16GA23GAGA12CA30GA50TC12CA51AT21GA14AG3AG14AG32GA1TC42TC1AG24GA9TC30AG11CT21CT13GA2AG14GA11TC23TC5AG30GA1CT1AG19CA7GT24CT11CT19AG66AC1GA11AGCT6GA24GA14CT53GA59AT44CT15AG10GA14TC5CT9TC40TA11GA15CT2AG8AG61GA8AG11CT5CT2GA38AT21AG2AGAC1GATC5AG3TC17GA5AG11CA25AG4AG55AT36GA56AG28CT63GA28TC77TC2CT72GA14TC6CT2AG1AT3AG9AG1AGAGTA5GT21ACTC51AG25TA52GA3GA9AC17CA29TC5TC11GC14TG13GATCGA7TC30CA16GA12AG21GA2GT23GC50AG9TC11GA7AG11AG5AG1GA27AT5TC5AC2GA2AG2GA14AT62TC14AG21AG3AC2TG15GA6TG14CA35GA17TC14CT28AC5GC49TCCA3AGGAGA4GC12TC7CT27GA4TA2GCAC5CT13CT11GA2CA22TC6CA44AT2GA1GT6AC3GT15TC5AC14GA2TACA-T1GTGC2GC1AC2AG1CGAGGACG1CTTG-G-G8GT8TA13AG17CT5GA2CA17CT20AG15TC19CT64GA19AGAT15GT5TC12AG20CG23GC10AG31CG6TG6-G-A-T-T-T-G-A-A-G4CA5TA-T-A-C2GA1GA3-G-T-A-G-C-G-G-G-A-G-A-A-T-G-A-T-A3CG1-G1CA2AG3AG21GA3AGTC4AGAC3GA8AGAT10CTGA4CT17GA2GA11GA6GCT-A-C-T-A-A-T-A-G-G-A-C-T-A-A-11GA5TC12TC14AG71GA3GAGAATGA4AGGAAC17TC5GC15CA17CT21TC7GA19GA14AG5ATAC3AT5AG6TC21AG2TCGAAC1AT5TGCA18TC1GA14GA3CA2AC1AG3GC-C-A-G-A-G-A14CA3TGAT1GA3CT4GA1A-A-T-7GA4AG2GAAC7GT4TA1CA1GT1AG2AGGAAG2GA1CA4GA1GA9CA1ACGA8AGAC6CAAGCAAG1GA6CG-G-A-A-A-T-A2GAGA1CA5GACTAC3GA22TA6AGCT2TC5CG30CT2CTAT2TA2GCCAGATC6GACTGA1GT2CT3ATAT1GAGA2CG1GA6CG2AC2CATAAGCGTG1GCGAGAGA3TC1TC2CA3TA1-G-T-G3ACTA5AC4AC16TA9GTAG6GA34AT3GC52CT1GA2AG2C-A-2A-A-A-T-G-G-T-G-G-C-G-A-G-A-A-T-G-G-G-A-C-C-C-A-G-A-T-T-G-G-C-G-A-G-4TA1AT2CG22GA32CT23GA9AG19AG32AGAGCG1TA1CA53GC8AG19TA21AG12CT7AG17AG32AG5TC34GA15AG39AG32AT8AC1AG6GAGAGTAC3TC18GC9GA7TC3GAAG7TC2AT11CG7GA5AG32GA12GA1CT15GA10CT18AT22TC2AG26GA11AG20CT11AG2CT7GA7GA2TC31CA33GAGTATTCCG14TC3AG5CT6AGTA3CT8TC4TG14TA26CT1GA37GA26GA38TC5TC5TC1TC3TC3TG7GT5AG9AG9CT1AG5AG2AGTC12CTTCTGAC10CG3GA14AG6GACT23GT9-G-T-A-G-T-G3GTGT6GCTC1GA12AG6GA3AG1T-A-A-G-C-C-A-G-A-A-G-A-13AG2GA7GA15TC4GA3TC4CA3CA18TC6TC7AC2TGAT2TC20AG11CT10GC6AG28GC4CG7CT42TC9AG3GA21GA1TCCT16TCCT35AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,635,1,634,9085,9718,0.0,758,91.969,584,plus,14TC9AG3GA21GA1TCCT16TCCT35AG10CA5TC13TA25CA2GA14GACA11AC16AG16AG2GT10AG6CG3AGTA5AG11AG9CT1GA4AG25TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-9 +OQ092462,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9714,9718,637,9075,9710,1,636,0.0,749,91.366,582,plus,14TC8ACAG3GA21GA1TCCT16TCCT9GA36CA5TC13TA24TGCA2GT7GA5TCGACA11AC16AG13GA2AG2GT10AG6CG3AGTA5AG11AG9CT1GA30TC1AT3AGGA10GT4TC2TG31-G5TC4TC33ATGC40TC15AT20CT6AG1GA96TCTC1GT5TC11A-11 OQ092464,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9556,8890,8917,592,9460,1,8890,0.0,10536,91.533,8162,plus,18TA2CT45T-TC11GTGAAG42CT27-A-C-T-G-G-T-G-A-G-T-A-C-G-C-C-A-A-T-T46GA34GA35AG10AG28GA20GT5AG6AG17TC13GA3GT5CA30AT13AGCT24CA2TG8CT5GA47AG19AG11AG2GA34AC22GAGC2AC31AG2AG13CG3CT1GA27GACT10AG5CT21CT4CT23TC17AC29TC5GA17GA5TCGC16AG5AT11CT5AT5TA7CA16GCGA11AGTC2TC6AG7AG23AC5GA7AC2AC1AC5AG1GA12AGCT7CT9GA6AG5GA2AC1CTCT25AT6TC6GCCTCT2AG14GA6AGAG12AC2AC2AG5CT1AC6AG5AC5CT5TCAT10AT2AG2AC4CGAGGC2AT4AT6AC3TC3ACGC1ATTG3AC16GA7AG14AT2AG12GATC5CG1CG3G-T-A-1CTAG12GA1GA1CT2-C7A-9AGGA1CT6GA5CT2CT14GA2TC5TC14TC5GA4GA21AG8CT11TC8GA22AGGA2CT17GA5AC8TC11AG9AT34AG15TC25AG3AC10AG10GA20CACA1CA6AG9GA3GA2AG1TC51GA1CA3AG7GA47GA10CA1GC3CTTC1GA4AC2CT8TC2AG4TC18AG35AG11TC2CT11TC102GA7CT23GA32TC29AG38AG10GA117AG2CA116TC100GA16AG8TC1AG14GA1AG42TC17AT59TC23GA5GA29CT16AG12AG17GA11AG3AG11AGGA24GA8AG39AT15TC22GT55AG10TC3AG11TA23GA15AG30CT6GA4GA1CT1AG8AG1GA3AG19CT81GA23GA17TG8CT5GA6TATA22AG22CTTC4AG2TG24TC10TC3CT20TG4AG20AC20TC37AG12AG17CA2GA2AC2CTCT73GA2AGGA34CG2TA27GT13CT15GA37CT3TC7GA44AG62TC35GA15CA53GA15CATC2AG14CT60GA16AG50GA8AG13AT3CT44GA2GA42TC20CA37CT26TG144GA8AC18AG5AG15AG1GAGAAT11GA11CA2TC26TA8GA11GT5GA3AG3CT3AT68GA1AG16GA9GA1TC19TC8CT46AG9TA5CG54GA8AG39AG34AC3CT53GA23CT8GA11CTAG7GA17AT5AG53TC7TA9GA4GA18CT1TC2AG2GA35TC13GA2TC5AG17TC6TACATA2TC2TC5GACA86GA6CA3CT16CT12GA9GT13ACCT7CA3GTCT23CT1AGTC22TA1TC5AG2CA23AG5GA1AG18TG38TC2GA5TC2AG8A-T-C-A-G-C-3TG5GA9TGGA27GA4AG5AC3TC15TC8AG18AT1TC5TCCT21AGAC3TGAT3TC23TC26CT8AG3GA9GA12GA21GA10AT2GA8GA26TC41GA13AGTG4ACCT2CT5TGATCTCG1CA1AGGC3C-A-A-8CA5CGC-A-C-T-A-C-3TA1GTCA1GA4AG1GA10GA1G-A-G-2AG18AG5AT8AG2GA5GA19CT10CT4AG11GA9AG3TA2TC4GCGATC6GA24GA23GA21GA17AC13CT8GA15TC16CT25GA51GAGA4AG20AGGA25TG9TA17AGTA25AG6CA1AC5CTCTAT11TG13CACA24CT7ACAC6AG3GA6AG1TA9GA1CA1AG4TG3AC3GA3AG11GAGAGA-A-A-T-C-A-A5GA7TC3TCAGCA2AT22GA2GA1AGACCT5AG3TC1AG15TC18AC1AG4TA8CA1TA4TG-C-A-G4CA2GA1TGAG-C-A-C6GTGA2GA1ATAG2TACGAT3GAACCT5CT1CA24GA12CATG39TC1GC4TGACCA4AG5CT9CT9CT2AT16G-A-A-A-9AG1CAAT1CTAG-T26AG55AG9AG55-A-A-C10GA52AG14GA7TA34CT25GA59GA29GA2AG26TC24GA22GA2ATCG1GA6GA1TC15GC1AG7GA19AG2TG9CA10AG2TG38GC4AG4ACAG24GA10GA17AG26GA29TC7CT36TC7AG11CA18AC1AG32GAAG9GAGT1CACG6GAAG1CT9AG4TC7TACA5GA53AG6AG32CGTC12GC34AG10AG4CT17CT17GA18GA2TG6GT1GACT1GT1GT6TA17AC22GA7TA13TC11GAAT4TCGA3TG3AG3CA5AG20GA-C-T-G-A-G-C-C-A-G-C-A-A30CT10CT19CT23CT8TC26TG5GA5TC2TC8GA32GA6GT50CT7AG11TG21CA10CA27CACA15GA14TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GA9TC5GA7AGTC3AG1GA3CA19CT5GA16CT8AT10GA20 OQ092464,Ref.28_BF.BR.99.BREPM12817.DQ085874,0,9556,8890,380,6,385,8511,8890,4.64e-128,456,91.842,349,plus,14CT7AG11TG21CA10CA27CACA15GA14TC20AG8GT5TAAC8GA26TC18TA34GA1AG4GA9TC5GA7AGTC3AG1GA3CA19CT5GA16CT8AT10GA20 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,9751,61,9718,1,9719,0.0,11550,91.734,8945,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA5CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA185TC5AG6TGAGGA8AG45-G-A-G-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T13TA72ACAG27AG5AG3CA4CT12CA49TGCT4GA11GC30GT1TC21TC48AG7GA25GC2AG18CA17G-4-ATA18AC4AC1GACT33CA23CG1TCTA35AG28AG12AT53AG1AG2TG38TC27TG13GT9GA13AG43AC28CA25TA2CT17TC5GA30GATC3TC8TC4AG54GA14ATAT7AG5GA17TC3CT13AG2TC29AG8AG38GA2GA5AC5CT2AG42-G-C-T2TCGA28TC10CTAT32TC1TC3AC20AG26AG5GA60CT7GA25AG38TC5AT16TC12GA28GA9AGAG34AG11GA50TA4AG3AG7AG21AG45GA91CT2TC20TC8AG101AG14AG50TC14TC17GA65GA5TC35AG14CA9AG11AG16CT22CT92GAGA2AC5AG59GA20AG23AG19AG100AGAT15TC20CA14AG26TCGC4AG32GA5TC18GA12CA30GA17GA24AT1GA6CT11CA17AG1TC26AG26GA35GA30GA3TC27CT12TC1AG2TC8AG26CG26TG11CT17AG20AG26TC23TC2AG2AG4GA2CT3CA18GA16GA6CA7AT11CT44AG20GA18CT26AC1GA19GA24GA14CT63TG13GAAG20AGCA15TA7GA3CT5CT39AG2AG54CT18CT29GA15AG61GA8AG11CT5CT6CT22GA3GA7AT2TC18AG5GA6AG21GA17TA29CAAG40AG8GT99AG40GA8CT42GA1CT26TC68GA14AG69CA20AGCT4CT3AGAG8AG7GT10CT12AC1CT26TC5GA8AT8AG6GA40CT30GA6AG5TG18CA24CT4TC5TC11GC14TG3AT2GT6GATCTA11CAAG13AG28GA13TC12GA10GT23GC4TC39AG15TC1TC5GA23AG7GA27AT9AGAG6AG3TC1CT7CA19AG13TCTA31TC2-T12AG4AG16AG22GA57GA3CG46CT10AC52CG3CA3AG6GC13ATGT30TC6CTTA2GCTC4TG26GACT22AT7GATA1AC32GA5TC2CGAT5AG5AC3GT39T-C-A-G-G-2GT1A-T-T-G-2GA18C-A-C-C-A-T-5AG21AG22AC4CA16TC23AG15TC14AG16CTCA7GA41TC15CGCT5AT21TC12AG25CT24TC36TG6TG6AG2GT1-G-A-A5TA5CA2AC5AG6TCAG1T-3GA1ATCG1GT-A6GATA6AG23TCGACG6AC4AG1AGAG4AG1AGAC14CT5AT3GA7GA2GA10GTGA6AC3AC7TA5TC2AG6TC10CT22AT7AG41AT12GA4AG1AC23ACCA34AG9GA23TC18AG5GA9ATAC9AG31TC1AC1AT2AG15TC12TC14TA2-C-C-G-T3TCTATG1-G1-G4GA3CAAG4AT2TGAT1GA3CT2AG1GA1C-A-T-12AG23GT3AGAC1GA1CA3GA4ACGA5GA5GA3TC1GACGAC18-G-G-A2GT12GA7TG14AG16TC3TC13CG21CTAT5AC1GA18ATA-T-G-6AGCT3CT3AG1-A-C-T-G-A-A-G-G-G-T-C-A4CATC5TAAGAGTA2-T-G-A3CA5TC5GA25GTAG6GA22TC10AGAT2GA7AG22TC1AGTC20GATACTCA2GAA-G-G-4CT1CACGCT1TC8TC26TC44GA11GA32AG4GA12AGAGCGGACA1GA6AT46GC26GA36CT29AC44GA20TC2CA16AG44AG9AG20TC5AC10ATAC3TC18GC1AG21GCATCT4TC2AT43GA14GA5GA24GA10CT18AT7CA14TCAT1AG5GT15AG4GA41GA2AG2CT7GA1TC5GA1TC11AC16CT37GAGTGT1AG14TC3TG2GA14CT4AG23GA28GA24AG12GA26GA5CT20GT11TC5TC11TC45AG2AGTC1GT12TG6CA23AG6GACT32TA5CG2GA11GA2AG26C-C-A-G-C-T-11ATGA23TC17CA6CG3TC13ACTC20GA17AG8GT10GC33AG1GC4AG1GA6GA41TC6CA2AG9AT15GA30GA9TC15AGCTTC9TC1AG16TA25-A-A-G-A-T-A1-A-A-G-A-G-G-C-C-A-A-T-A10TC1GC1TA1TC3CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2TC2-G16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,636,59,675,9084,9719,0.0,705,88.994,566,plus,16TC6CA2AG9AT15GA30GA9TC15AGCTTC9TC1AG16TA23-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G-C-C-A2GA10TC1GC1TA5CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 -OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9719,636,9104,9720,1,636,0.0,699,88.836,565,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA1TC3CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA168 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,9750,61,9718,1,9718,0.0,11560,91.764,8947,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA5CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA185TC5AG6TGAGGA8AG45-G-A-G-G-C-G-A-G-G-G-G-C-G-G-C-G-A-C-T-G-G-T13TA72ACAG27AG5AG3CA4CT12CA49TGCT4GA11GC30GT1TC21TC48AG7GA25GC2AG18CA17G-4-ATA18AC4AC1GACT33CA23CG1TCTA35AG28AG12AT53AG1AG2TG38TC27TG13GT9GA13AG43AC28CA25TA2CT17TC5GA30GATC3TC8TC4AG54GA14ATAT7AG5GA17TC3CT13AG2TC29AG8AG38GA2GA5AC5CT2AG42-G-C-T2TCGA28TC10CTAT32TC1TC3AC20AG26AG5GA60CT7GA25AG38TC5AT16TC12GA28GA9AGAG34AG11GA50TA4AG3AG7AG21AG45GA91CT2TC20TC8AG101AG14AG50TC14TC17GA65GA5TC35AG14CA9AG11AG16CT22CT92GAGA2AC5AG59GA20AG23AG19AG100AGAT15TC20CA14AG26TCGC4AG32GA5TC18GA12CA30GA17GA24AT1GA6CT11CA17AG1TC26AG26GA35GA30GA3TC27CT12TC1AG2TC8AG26CG26TG11CT17AG20AG26TC23TC2AG2AG4GA2CT3CA18GA16GA6CA7AT11CT44AG20GA18CT26AC1GA19GA24GA14CT63TG13GAAG20AGCA15TA7GA3CT5CT39AG2AG54CT18CT29GA15AG61GA8AG11CT5CT6CT22GA3GA7AT2TC18AG5GA6AG21GA17TA29CAAG40AG8GT99AG40GA8CT42GA1CT26TC68GA14AG69CA20AGCT4CT3AGAG8AG7GT10CT12AC1CT26TC5GA8AT8AG6GA40CT30GA6AG5TG18CA24CT4TC5TC11GC14TG3AT2GT6GATCTA11CAAG13AG28GA13TC12GA10GT23GC4TC39AG15TC1TC5GA23AG7GA27AT9AGAG6AG3TC1CT7CA19AG13TCTA31TC14AG4AG16AG22GA57GA3CG46CT10AC52CG3CA3AG6GC13ATGT37CTTA2GCTC4TG26GACT22AT7GATA1AC32GA5TC2CGAT5AG5AC3GT39T-C-A-G-G-2GT1A-T-T-G-2GA18C-A-C-C-A-T-5AG21AG22AC4CA16TC23AG15TC14AG16CTCA7GA41TC15CGCT5AT21TC12AG25CT24TC36TG6TG6AG2GT1-G-A-A5TA5CA2AC5AG6TCAG1T-3GA1ATCG1GT-A6GATA6AG23TCGACG6AC4AG1AGAG4AG1AGAC14CT5AT3GA7GA2GA10GTGA6AC3AC7TA5TC2AG6TC10CT22AT7AG41AT12GA4AG1AC23ACCA34AG9GA23TC18AG5GA9ATAC9AG31TC1AC1AT2AG15TC12TC14TA2-C-C-G-T3TCTATG1-G1-G4GA3CAAG4AT2TGAT1GA3CT2AG1GA1C-A-T-12AG23GT3AGAC1GA1CA3GA4ACGA5GA5GA3TC1GACGAC18-G-G-A2GT12GA7TG14AG16TC3TC13CG21CTAT5AC1GA18ATA-T-G-6AGCT3CT3AG1-A-C-T-G-A-A-G-G-G-T-C-A4CATC5TAAGAGTA2-T-G-A3CA5TC5GA25GTAG6GA22TC10AGAT2GA7AG22TC1AGTC20GATACTCA2GAA-G-G-4CT1CACGCT1TC8TC26TC44GA11GA32AG4GA12AGAGCGGACA1GA6AT46GC26GA36CT29AC44GA20TC2CA16AG44AG9AG20TC5AC10ATAC3TC18GC1AG21GCATCT4TC2AT43GA14GA5GA24GA10CT18AT7CA14TCAT1AG5GT15AG4GA41GA2AG2CT7GA1TC5GA1TC11AC17AC36GAGTGT1AG14TC3TG2GA14CT4AG23GA28GA24AG12GA26GA5CT20GT11TC5TC11TC45AG2AGTC1GT12TG6CA23AG6GACT32TA5CG2GA11GA2AG26C-C-A-G-C-T-11ATGA23TC17CA6CG3TC13ACTC20GA17AG8GT10GC33AG1GC4AG1GA6GA41TC6CA2AG9AT15GA40TC15AGCTTC9TC1AG16TA25-A-A-G-A-T-A1-A-A-G-A-G-G-C-C-A-A-T-A10TC1GC1TA1TC3CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2TC2-G16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,636,59,675,9083,9718,0.0,708,89.151,567,plus,16TC6CA2AG9AT15GA40TC15AGCTTC9TC1AG16TA23-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G-C-C-A2GA10TC1GC1TA5CT7GTAG3AG2AT7GACTAG6AC1AG2AG8AG3AGTA5AG10AC17AGAT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA166 +OQ092467,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9936,9718,636,9104,9720,1,636,0.0,699,88.836,565,plus,14TC6CA1ACAG9AT15GA30GA9TC16CTTC9TC1AG16TA24-G-A-A-G-T-T-A-G-A-A-G-ATA1-C-C-A-A-C-A10TC1GC1TA1TC3CT7GTAG3AG2AT6GAGACTAG6AC1AG2AG8AG3AGTA5AG10AC18AT26AT3AG11CT1AG2-C2TG16AG9GTCT9TC5AC33GC15CT6CT19AG1CT1GA168 diff --git a/tests/expected-results-large/errors.json b/tests/expected-results-large/errors.json index 7ec8e1b..70d4d31 100644 --- a/tests/expected-results-large/errors.json +++ b/tests/expected-results-large/errors.json @@ -8,7 +8,7 @@ { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6323" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6322" }, { "sequence_name": "KX505501.1", @@ -17,33 +17,38 @@ }, { "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 195 positions." + "error": "DeletionInOrf", + "message": "Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon1 at 5969-6047 contains an internal stop codon at 6005" + "message": "Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004" }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 40 positions." + "message": "Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions." + }, + { + "sequence_name": "KX505501.1", + "error": "FrameshiftInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions." }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 96" + "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1116" + "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" }, { "sequence_name": "KX505501.1", @@ -64,13 +69,13 @@ "MN691959": [ { "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123" }, { "sequence_name": "MN691959", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" } ], "MN692074": [ @@ -82,7 +87,7 @@ { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6551" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" }, { "sequence_name": "MN692074", @@ -92,32 +97,32 @@ { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpr at 5558-5843 can have maximum insertions 90, got 261" + "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 108" + "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 76 positions." + "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions." }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 204" + "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1131" + "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" }, { "sequence_name": "MN692074", @@ -130,18 +135,7 @@ "message": "Query sequence contains a long deletion." } ], - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MN692145", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" - } - ], + "MN692145": [], "MN090335": [ { "sequence_name": "MN090335", @@ -150,13 +144,8 @@ }, { "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MN090335", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 282" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" }, { "sequence_name": "MN090335", @@ -185,16 +174,6 @@ "error": "InternalStopInOrf", "message": "ORF gag at 789-2292 contains an internal stop codon at 822" }, - { - "sequence_name": "MN090376", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MN090376", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 252" - }, { "sequence_name": "MN090376", "error": "PackagingSignalDeletion", @@ -216,29 +195,8 @@ "message": "Sequence contains an internal inversion." } ], - "MK115581.1": [ - { - "sequence_name": "MK115581.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115581.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], + "MK115581.1": [], "MK115690.1": [ - { - "sequence_name": "MK115690.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK115690.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115690.1", "error": "PackagingSignalDeletion", @@ -248,19 +206,14 @@ "sequence_name": "MK115690.1", "error": "MajorSpliceDonorSiteMutated", "message": "Query sequence has a mutated splice donor site, G-." + }, + { + "sequence_name": "MK115690.1", + "error": "Scramble", + "message": "Sequence is plus-scrambled." } ], "MK115571.1": [ - { - "sequence_name": "MK115571.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115571.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115571.1", "error": "PackagingSignalDeletion", @@ -273,16 +226,6 @@ } ], "MK115514.1": [ - { - "sequence_name": "MK115514.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115514.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115514.1", "error": "MajorSpliceDonorSiteMutated", @@ -290,16 +233,6 @@ } ], "MK115488.1": [ - { - "sequence_name": "MK115488.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115488.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115488.1", "error": "MajorSpliceDonorSiteMutated", @@ -307,16 +240,6 @@ } ], "MK115030.1": [ - { - "sequence_name": "MK115030.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK115030.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" - }, { "sequence_name": "MK115030.1", "error": "Scramble", @@ -328,33 +251,12 @@ "message": "Sequence contains an internal inversion." } ], - "MK115498.1": [ - { - "sequence_name": "MK115498.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115498.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], + "MK115498.1": [], "MK115211.1": [ { "sequence_name": "MK115211.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6890" - }, - { - "sequence_name": "MK115211.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK115211.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 252" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6889" }, { "sequence_name": "MK115211.1", @@ -392,13 +294,8 @@ "MK114705.1": [ { "sequence_name": "MK114705.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 74 positions." - }, - { - "sequence_name": "MK114705.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF nef at 8796-9417 contains out of frame indels that impact 122 positions." + "error": "DeletionInOrf", + "message": "Smaller ORF nef at 8795-9416 can have maximum deletions 30, got 186" } ], "MK114856.1": [ @@ -415,7 +312,7 @@ { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6326" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6325" }, { "sequence_name": "MK114856.1", @@ -425,32 +322,37 @@ { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains an internal stop codon at 5594" + "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5594" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5920" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5919" }, { "sequence_name": "MK114856.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpu at 6259-6310 contains out of frame indels that impact 67 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434" + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8796-9417 contains an internal stop codon at 8853" + "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + }, + { + "sequence_name": "MK114856.1", + "error": "InternalStopInOrf", + "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8852" }, { "sequence_name": "MK114856.1", "error": "APOBECHypermutationDetected", - "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.399685326687554e-65)." + "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 3.639064030015132e-65)." } ], "MK115009.1": [ @@ -467,42 +369,37 @@ { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6350" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6349" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5373" }, - { - "sequence_name": "MK115009.1", - "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 5558-5843 can have maximum deletions 30, got 75" - }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5860" + "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5717" }, { "sequence_name": "MK115009.1", - "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 177" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434" + "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8796-9417 contains an internal stop codon at 8874" + "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" }, { "sequence_name": "MK115009.1", "error": "APOBECHypermutationDetected", - "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 1.3731449337509935e-41)." + "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 1.2040967664149076e-41)." }, { "sequence_name": "MK115009.1", @@ -518,27 +415,11 @@ "MK115387.1": [ { "sequence_name": "MK115387.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK115387.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 279" - } - ], - "MK115491.1": [ - { - "sequence_name": "MK115491.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115491.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" } ], + "MK115491.1": [], "MK116110.1": [ { "sequence_name": "MK116110.1", @@ -556,58 +437,16 @@ "message": "Query sequence has a mutated splice donor site, CC." } ], - "MK115527.1": [ - { - "sequence_name": "MK115527.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115527.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], + "MK115527.1": [], "MK114997.1": [ { "sequence_name": "MK114997.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6512" - }, - { - "sequence_name": "MK114997.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK114997.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" - } - ], - "MK115518.1": [ - { - "sequence_name": "MK115518.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115518.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6511" } ], + "MK115518.1": [], "MK115065.1": [ - { - "sequence_name": "MK115065.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MK115065.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 270" - }, { "sequence_name": "MK115065.1", "error": "PackagingSignalDeletion", @@ -643,7 +482,7 @@ { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6425" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6424" }, { "sequence_name": "MK115464.1", @@ -653,57 +492,41 @@ { "sequence_name": "MK115464.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." + "message": "Smaller ORF tat_exon1 at 5829-6045 contains out of frame indels that impact 104 positions." }, { "sequence_name": "MK115464.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains out of frame indels that impact 104 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434" + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" }, { "sequence_name": "MK115464.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF nef at 8796-9417 contains out of frame indels that impact 393 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" }, { "sequence_name": "MK115464.1", - "error": "APOBECHypermutationDetected", - "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 5.391006513622446e-23)." - } - ], - "MK115530.1": [ - { - "sequence_name": "MK115530.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" }, { - "sequence_name": "MK115530.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" + "sequence_name": "MK115464.1", + "error": "APOBECHypermutationDetected", + "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.937891251407691e-23)." } ], + "MK115530.1": [], "MK115520.1": [ { "sequence_name": "MK115520.1", "error": "InternalStopInOrf", "message": "ORF pol at 2084-5096 contains an internal stop codon at 2198" }, - { - "sequence_name": "MK115520.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115520.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115520.1", "error": "MajorSpliceDonorSiteMutated", @@ -715,29 +538,8 @@ "message": "Sequence contains an internal inversion." } ], - "MK115503.1": [ - { - "sequence_name": "MK115503.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115503.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], + "MK115503.1": [], "MK115570.1": [ - { - "sequence_name": "MK115570.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115570.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - }, { "sequence_name": "MK115570.1", "error": "PackagingSignalDeletion", @@ -749,29 +551,8 @@ "message": "Query sequence has a missing splice donor site, --." } ], - "MK115509.1": [ - { - "sequence_name": "MK115509.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115509.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], + "MK115509.1": [], "MK115702.1": [ - { - "sequence_name": "MK115702.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 74 positions." - }, - { - "sequence_name": "MK115702.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" - }, { "sequence_name": "MK115702.1", "error": "PackagingSignalDeletion", @@ -807,84 +588,42 @@ { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6551" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5151" }, - { - "sequence_name": "MK115095.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5860" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" }, { "sequence_name": "MK115095.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpu at 6259-6310 contains out of frame indels that impact 43 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 contains an internal stop codon at 8434" + "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" }, { "sequence_name": "MK115095.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 213" + "error": "InternalStopInOrf", + "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" }, { "sequence_name": "MK115095.1", "error": "APOBECHypermutationDetected", - "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 9.460464921885922e-40)." - } - ], - "MK115490.1": [ - { - "sequence_name": "MK115490.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115490.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" - } - ], - "MK115576.1": [ - { - "sequence_name": "MK115576.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MK115576.1", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 243" + "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 8.33506116803153e-40)." } ], + "MK115490.1": [], + "MK115576.1": [], "OQ092466": [ - { - "sequence_name": "OQ092466", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "OQ092466", - "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 195" - }, - { - "sequence_name": "OQ092466", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 261" - }, { "sequence_name": "OQ092466", "error": "MajorSpliceDonorSiteMutated", @@ -911,21 +650,6 @@ } ], "OQ092462": [ - { - "sequence_name": "OQ092462", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "OQ092462", - "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 195" - }, - { - "sequence_name": "OQ092462", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 255" - }, { "sequence_name": "OQ092462", "error": "PackagingSignalDeletion", @@ -950,16 +674,6 @@ } ], "OQ092467": [ - { - "sequence_name": "OQ092467", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "OQ092467", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 237" - }, { "sequence_name": "OQ092467", "error": "PackagingSignalDeletion", diff --git a/tests/expected-results-large/holistic.json b/tests/expected-results-large/holistic.json index a84c4dc..f1d654f 100644 --- a/tests/expected-results-large/holistic.json +++ b/tests/expected-results-large/holistic.json @@ -4,23 +4,23 @@ "hypermutation_probablility": 0.7087072014754221, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 1997, - "blast_sseq_coverage": 0.2498199403230785, + "blast_sseq_coverage": 0.2498456472525211, "blast_qseq_coverage": 1.2158237356034052, - "blast_sseq_orfs_coverage": 0.17661753684736448, + "blast_sseq_orfs_coverage": 0.17663960024984385, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MN691959": { "qlen": 9493, - "hypermutation_probablility": 0.19593905853945925, + "hypermutation_probablility": 0.19667690182893238, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9493, - "blast_sseq_coverage": 1.0816956477003807, + "blast_sseq_coverage": 1.0817040543321672, "blast_qseq_coverage": 1.1086063415148004, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MN692074": { @@ -28,143 +28,143 @@ "hypermutation_probablility": 0.36378645339477633, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 4178, - "blast_sseq_coverage": 0.5041670953801831, + "blast_sseq_coverage": 0.5042189750977567, "blast_qseq_coverage": 1.1728099569171853, - "blast_sseq_orfs_coverage": 0.41144141893579816, + "blast_sseq_orfs_coverage": 0.4114928169893816, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MN692145": { "qlen": 9689, - "hypermutation_probablility": 0.1661041079701131, + "hypermutation_probablility": 0.1672411051048176, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9689, - "blast_sseq_coverage": 1.1304660973351168, + "blast_sseq_coverage": 1.130479522535501, "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MN090335": { "qlen": 9069, - "hypermutation_probablility": 0.1754017863888554, + "hypermutation_probablility": 0.1771850809736527, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9069, - "blast_sseq_coverage": 0.9842576396748637, + "blast_sseq_coverage": 0.9842560197571517, "blast_qseq_coverage": 1.0603153600176425, - "blast_sseq_orfs_coverage": 1.0003747189607795, + "blast_sseq_orfs_coverage": 1.0003747657713928, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MN090376": { "qlen": 8985, - "hypermutation_probablility": 0.026007919521734202, + "hypermutation_probablility": 0.026415767987601813, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 8985, - "blast_sseq_coverage": 0.9784957300133759, + "blast_sseq_coverage": 0.9784935171846059, "blast_qseq_coverage": 1.0604340567612687, - "blast_sseq_orfs_coverage": 0.9943792155883088, + "blast_sseq_orfs_coverage": 0.9943785134291068, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115581.1": { "qlen": 9495, - "hypermutation_probablility": 0.6897199265079494, + "hypermutation_probablility": 0.6919440876652894, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9495, - "blast_sseq_coverage": 0.9870357032616525, + "blast_sseq_coverage": 0.987034369211772, "blast_qseq_coverage": 1.0046340179041602, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115690.1": { "qlen": 9689, - "hypermutation_probablility": 0.05065930954004094, + "hypermutation_probablility": 0.051230576250981485, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9689, - "blast_sseq_coverage": 0.988167506945159, - "blast_qseq_coverage": 0.9949427185468056, + "blast_sseq_coverage": 1.004630582424367, + "blast_qseq_coverage": 1.0113530808132933, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, - "blast_n_conseqs": 2 + "orfs_end": 8794, + "blast_n_conseqs": 3 }, "MK115571.1": { "qlen": 9394, - "hypermutation_probablility": 0.8012585672082311, + "hypermutation_probablility": 0.8029570594372466, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9394, - "blast_sseq_coverage": 0.9866241382858318, + "blast_sseq_coverage": 0.9866227618851615, "blast_qseq_coverage": 1.0113902490951672, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115514.1": { "qlen": 9382, - "hypermutation_probablility": 0.6458974386368621, + "hypermutation_probablility": 0.6482462132632603, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9382, - "blast_sseq_coverage": 0.9864183557979216, + "blast_sseq_coverage": 0.9864169582218564, "blast_qseq_coverage": 1.0173736943082499, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115488.1": { "qlen": 9623, - "hypermutation_probablility": 0.6511896911074662, + "hypermutation_probablility": 0.6534999185838631, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9623, - "blast_sseq_coverage": 1.0255170285008746, + "blast_sseq_coverage": 1.0255196542498457, "blast_qseq_coverage": 1.0325262392185388, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 6 }, "MK115030.1": { "qlen": 9126, - "hypermutation_probablility": 0.031598631869680704, + "hypermutation_probablility": 0.032014462397289556, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9126, - "blast_sseq_coverage": 0.9940323078506019, + "blast_sseq_coverage": 0.994031693764149, "blast_qseq_coverage": 1.0655270655270654, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115498.1": { "qlen": 9461, - "hypermutation_probablility": 0.8339748776671196, + "hypermutation_probablility": 0.83547963060225, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9461, - "blast_sseq_coverage": 0.9866241382858318, + "blast_sseq_coverage": 0.9866227618851615, "blast_qseq_coverage": 1.0080329774865235, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115211.1": { "qlen": 9032, - "hypermutation_probablility": 0.11689558806708, + "hypermutation_probablility": 0.11818291879607423, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9032, - "blast_sseq_coverage": 0.9950612202901533, + "blast_sseq_coverage": 0.995060712080675, "blast_qseq_coverage": 1.0598981399468557, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115158.1": { @@ -181,14 +181,14 @@ }, "MK114705.1": { "qlen": 9411, - "hypermutation_probablility": 0.14449377496074622, + "hypermutation_probablility": 0.14584270737492833, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9411, - "blast_sseq_coverage": 1.0980553554892478, + "blast_sseq_coverage": 1.098065445564931, "blast_qseq_coverage": 1.122622463075125, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 6 }, "MK114856.1": { @@ -196,11 +196,11 @@ "hypermutation_probablility": 1.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9477, - "blast_sseq_coverage": 1.0485646671468258, + "blast_sseq_coverage": 1.0485696645400289, "blast_qseq_coverage": 1.0812493405085997, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MK115009.1": { @@ -208,35 +208,35 @@ "hypermutation_probablility": 1.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9207, - "blast_sseq_coverage": 0.9965016977055252, + "blast_sseq_coverage": 0.9965013377238114, "blast_qseq_coverage": 1.0590854784403172, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115387.1": { "qlen": 9136, - "hypermutation_probablility": 0.5412311092694289, + "hypermutation_probablility": 0.5436355526687852, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9136, - "blast_sseq_coverage": 0.9796275336968824, + "blast_sseq_coverage": 0.9796254373327845, "blast_qseq_coverage": 1.040936952714536, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115491.1": { "qlen": 9422, - "hypermutation_probablility": 0.8951015182445495, + "hypermutation_probablility": 0.8961809048805741, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9422, - "blast_sseq_coverage": 1.003704084782385, + "blast_sseq_coverage": 1.0037044659394938, "blast_qseq_coverage": 1.0299299511780937, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK116110.1": { @@ -253,50 +253,50 @@ }, "MK115527.1": { "qlen": 9481, - "hypermutation_probablility": 0.7689834393883834, + "hypermutation_probablility": 0.770862998910788, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9481, - "blast_sseq_coverage": 0.986727029529787, + "blast_sseq_coverage": 0.9867256637168141, "blast_qseq_coverage": 1.0056956017297753, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK114997.1": { "qlen": 9055, - "hypermutation_probablility": 0.054959132555391754, + "hypermutation_probablility": 0.05560625344150194, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9055, - "blast_sseq_coverage": 0.9784957300133759, + "blast_sseq_coverage": 0.9784935171846059, "blast_qseq_coverage": 1.0516841524019878, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115518.1": { "qlen": 9537, - "hypermutation_probablility": 0.6385326595592609, + "hypermutation_probablility": 0.6408152618300496, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9537, - "blast_sseq_coverage": 0.9847720958946393, + "blast_sseq_coverage": 0.9847705289154147, "blast_qseq_coverage": 0.9996854356715948, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115065.1": { "qlen": 9214, - "hypermutation_probablility": 0.033517722768753644, + "hypermutation_probablility": 0.033954952452739495, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9214, - "blast_sseq_coverage": 1.0080255170285009, + "blast_sseq_coverage": 1.0080263428689031, "blast_qseq_coverage": 1.069459518124593, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 6 }, "MK115464.1": { @@ -304,83 +304,83 @@ "hypermutation_probablility": 1.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9663, - "blast_sseq_coverage": 0.9838460746990431, + "blast_sseq_coverage": 0.9838444124305412, "blast_qseq_coverage": 0.9893407844354756, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115530.1": { "qlen": 9544, - "hypermutation_probablility": 0.5789377103398377, + "hypermutation_probablility": 0.5812621948015355, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9544, - "blast_sseq_coverage": 0.9866241382858318, + "blast_sseq_coverage": 0.9866227618851615, "blast_qseq_coverage": 0.9992665549036044, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115520.1": { "qlen": 9589, - "hypermutation_probablility": 0.5200353682902832, + "hypermutation_probablility": 0.5225247969864292, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9589, - "blast_sseq_coverage": 0.9787015125012861, + "blast_sseq_coverage": 0.9786993208479111, "blast_qseq_coverage": 0.987902805297737, - "blast_sseq_orfs_coverage": 1.012115913065201, + "blast_sseq_orfs_coverage": 1.0121174266083697, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115503.1": { "qlen": 9617, - "hypermutation_probablility": 0.4263025132504157, + "hypermutation_probablility": 0.42870398270204335, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9617, - "blast_sseq_coverage": 0.9870357032616525, + "blast_sseq_coverage": 0.987034369211772, "blast_qseq_coverage": 0.9953207861079338, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115570.1": { "qlen": 9485, - "hypermutation_probablility": 0.738578434638724, + "hypermutation_probablility": 0.7406166892211931, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9485, - "blast_sseq_coverage": 0.9866241382858318, + "blast_sseq_coverage": 0.9866227618851615, "blast_qseq_coverage": 1.0057986294148655, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115509.1": { "qlen": 9353, - "hypermutation_probablility": 0.7866198309713798, + "hypermutation_probablility": 0.7883768413537747, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9353, - "blast_sseq_coverage": 0.9866241382858318, + "blast_sseq_coverage": 0.9866227618851615, "blast_qseq_coverage": 1.0197797498128942, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115702.1": { "qlen": 9098, - "hypermutation_probablility": 0.14401391767451666, + "hypermutation_probablility": 0.1454272422215308, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9098, - "blast_sseq_coverage": 0.987447268237473, + "blast_sseq_coverage": 0.9874459765383824, "blast_qseq_coverage": 1.0596834469114091, - "blast_sseq_orfs_coverage": 1.019860104921309, + "blast_sseq_orfs_coverage": 1.0198625858838226, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MK115095.1": { @@ -388,47 +388,47 @@ "hypermutation_probablility": 1.0, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9137, - "blast_sseq_coverage": 0.9907397880440375, + "blast_sseq_coverage": 0.9907388351512657, "blast_qseq_coverage": 1.060085367188355, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 2 }, "MK115490.1": { "qlen": 9347, - "hypermutation_probablility": 0.8863248655310947, + "hypermutation_probablility": 0.8875203448314265, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9347, - "blast_sseq_coverage": 0.9848749871385946, + "blast_sseq_coverage": 0.9848734307470673, "blast_qseq_coverage": 1.0204343639670483, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MK115576.1": { "qlen": 9266, - "hypermutation_probablility": 0.818189227062389, + "hypermutation_probablility": 0.8197662757563093, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9266, - "blast_sseq_coverage": 0.9917687004835889, + "blast_sseq_coverage": 0.9917678534677917, "blast_qseq_coverage": 1.0342110943233327, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "OQ092466": { "qlen": 9686, - "hypermutation_probablility": 0.3876036547663967, + "hypermutation_probablility": 0.3858261890626, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9686, - "blast_sseq_coverage": 1.1015536577837226, + "blast_sseq_coverage": 1.1015641078411196, "blast_qseq_coverage": 1.1192442700805285, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "OQ092463": { @@ -457,14 +457,14 @@ }, "OQ092462": { "qlen": 9714, - "hypermutation_probablility": 0.10777665573070194, + "hypermutation_probablility": 0.10883643311676816, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9714, - "blast_sseq_coverage": 1.130671879823027, + "blast_sseq_coverage": 1.1306853261988064, "blast_qseq_coverage": 1.1301214741610048, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "OQ092464": { @@ -481,14 +481,14 @@ }, "OQ092467": { "qlen": 9936, - "hypermutation_probablility": 0.6416537859942263, + "hypermutation_probablility": 0.6438715160567257, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9936, - "blast_sseq_coverage": 1.1308776623109373, + "blast_sseq_coverage": 1.1308911298621116, "blast_qseq_coverage": 1.0962157809983897, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-large/intact.fasta b/tests/expected-results-large/intact.fasta index e69de29..2d494f4 100644 --- a/tests/expected-results-large/intact.fasta +++ b/tests/expected-results-large/intact.fasta @@ -0,0 +1,1754 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA +>MK115581.1 +AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA +ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA +TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT +AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT +GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG +AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA +GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG +CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG +ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT +TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT +CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG +AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG +TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA +AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA +TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG +CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG +CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC +ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA +GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA +GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC +CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG +TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA +GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA +AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT +TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG +GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA +ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT +GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA +AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG +GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC +CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA +AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA +GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG +AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT +AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG +TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG +AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT +ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA +AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC +AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG +TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG +GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT +ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC +TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT +GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT +AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA +TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA +TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT +TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA +AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG +TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC +ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA +AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA +AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA +TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT +AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA +ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC +CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA +ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG +AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC +CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA +TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC +ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA +GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT +AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC +CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT +ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA +GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT +AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT +TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG +GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC +CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA +AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA +GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA +AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT +ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG +GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC +AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT +TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA +TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT +GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC +CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG +AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG +TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT +CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG +GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA +GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC +AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA +ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA +TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA +ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC +ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG +GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC +AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC +GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG +TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA +TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA +GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG +AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG +TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA +TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG +GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA +GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG +CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA +CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG +GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA +AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT +GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA +AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA +AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA +TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA +GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA +CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT +ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA +CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA +AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC +CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA +CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA +AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA +GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA +CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA +GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA +TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG +GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG +TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC +AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC +AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG +GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT +TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA +GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG +GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT +AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA +GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA +CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC +GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG +GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC +TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC +AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC +TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA +CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG +GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT +AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA +CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC +CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC +TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG +GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA +CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA +TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA +AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA +AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA +GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG +GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC +TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC +CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG +CACTCAAGGCAAGCT +>MK115498.1 +AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC +TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG +GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA +CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT +CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA +ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA +GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA +GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT +CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG +GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA +ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT +AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA +GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA +GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG +GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA +GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC +ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA +ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT +GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT +ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA +GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT +ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG +TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA +ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA +GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA +GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA +GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC +ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA +CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC +CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA +GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC +AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA +TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT +TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT +TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG +GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC +TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC +CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT +TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA +ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT +TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA +TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG +CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA +GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA +AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC +AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG +AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC +TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC +TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG +TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA +TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC +CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG +TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA +ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT +ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA +AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC +AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT +GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA +TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA +AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA +ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA +ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG +AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG +CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA +CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA +AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA +AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG +TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC +TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG +GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC +ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG +GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA +TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA +CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT +ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC +AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC +TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA +ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC +AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT +TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC +TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA +TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG +GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA +GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC +ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC +TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA +CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC +AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG +TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG +GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC +ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA +ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT +CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA +AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA +GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT +CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG +ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT +GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA +TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC +TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC +CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC +CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC +AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA +TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA +TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA +AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA +ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC +ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC +AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA +GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA +GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT +TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT +ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG +AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT +TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA +TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA +TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC +TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG +CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC +CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG +TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG +GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC +CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT +CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT +ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT +TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG +AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC +TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT +GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC +AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA +ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT +GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT +TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC +CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA +AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA +CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC +AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT +CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC +CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC +TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG +GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC +GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG +CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG +AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT +TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA +TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT +TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT +GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT +TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA +AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA +AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG +GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC +GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT +AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115491.1 +CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT +TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG +ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC +TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG +GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC +GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA +GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG +CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA +TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA +AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA +ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT +CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT +GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG +AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA +ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC +TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG +AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA +TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG +AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC +AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA +TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA +TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC +AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG +AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA +ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA +TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA +TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA +AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC +CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG +AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT +TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG +AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT +CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA +AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG +AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA +TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC +ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC +CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT +TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT +GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT +TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA +TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA +AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA +TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG +GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA +AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA +TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA +AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA +TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT +ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT +GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA +ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT +AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC +ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT +TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA +CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT +AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG +GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC +CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA +TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG +AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC +AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA +TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT +AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG +AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT +TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC +AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA +TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG +GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG +TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT +CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT +CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT +TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT +TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT +CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT +AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA +AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT +TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC +AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT +GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG +TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA +TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG +GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA +AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT +ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC +CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA +AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG +AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG +GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG +GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA +GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA +TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC +TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA +AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG +GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT +CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG +GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA +GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA +AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG +GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA +GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT +GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA +GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA +AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG +CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT +AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC +AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT +GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA +GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC +CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT +AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA +CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC +AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC +AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA +GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT +ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT +AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA +TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG +AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC +AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT +TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG +ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT +AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG +CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA +GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT +GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG +CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC +CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT +GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG +ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT +GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG +GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA +ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT +AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA +CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT +CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC +CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA +CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG +CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA +GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA +ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG +TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG +GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC +AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT +TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG +CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA +TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC +ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT +GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA +TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT +TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT +CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG +GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT +CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA +GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC +GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG +TA +>MK115527.1 +ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC +GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA +CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT +AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG +CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA +GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA +ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC +ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT +GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT +AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA +GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC +TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT +TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC +ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA +CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG +AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC +AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA +AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC +CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA +ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT +CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG +GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG +ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG +GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA +ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA +TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT +TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG +TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA +TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG +TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG +CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA +ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT +GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT +TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG +AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC +AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG +GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC +AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT +GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT +CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG +AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC +TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC +AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT +TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA +CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT +TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC +AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA +TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA +TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT +CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT +GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA +ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT +CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC +AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC +AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA +AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG +GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC +AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA +AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA +ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC +TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA +AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA +CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA +TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT +CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA +GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA +AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA +AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA +AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA +GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA +TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG +AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA +TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA +AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG +ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA +GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG +TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA +TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG +AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA +CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA +CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG +GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT +CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA +GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG +GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA +TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA +GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC +AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG +AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG +CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA +AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC +ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA +GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA +ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT +GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT +GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC +CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT +GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC +AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA +TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA +AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA +GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG +ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT +GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA +GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA +GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG +ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC +CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT +GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA +AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT +AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT +CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT +CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA +CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA +GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA +GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA +AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA +AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT +GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG +GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA +ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT +GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA +AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG +TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA +GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG +CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA +GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA +GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA +AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC +ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC +CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT +AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA +AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG +CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG +TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG +ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT +TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA +ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC +TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA +GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC +CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT +AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA +GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA +AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC +TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG +AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG +CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT +GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA +GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT +CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG +ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA +TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA +AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA +GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG +CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA +TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG +AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC +T +>MK115518.1 +TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG +CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT +AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG +CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG +CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC +CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT +AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC +CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT +CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC +GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA +TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT +AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC +AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA +ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT +ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA +GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT +AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC +ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC +ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA +TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG +ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG +TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC +ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT +AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG +AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA +AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT +AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG +GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA +TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG +TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA +ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG +GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC +AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA +GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG +CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA +GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA +GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT +GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA +AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA +CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA +GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA +AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT +ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG +GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA +CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT +GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG +CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA +GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT +GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT +CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT +TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA +AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT +CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA +CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA +ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA +GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT +CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA +ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA +TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC +ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA +TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA +GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC +CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT +TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA +CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG +GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA +GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC +CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA +CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG +GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA +GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT +ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG +CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC +GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA +GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG +GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA +GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA +CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG +GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA +GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT +AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT +TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG +GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC +ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA +ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT +TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC +TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG +ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG +AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA +GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA +CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT +ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA +CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA +CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG +AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA +AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG +ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT +ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT +AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG +GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA +AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT +TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT +GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG +CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG +GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC +ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC +TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG +AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA +ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG +ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA +AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA +AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT +GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG +AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC +ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA +TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC +AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA +AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC +CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC +AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA +ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG +CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC +TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG +ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT +TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG +GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT +CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA +ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA +AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG +GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT +GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG +AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG +AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA +ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG +GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC +CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG +AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG +CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT +TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA +AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT +TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC +AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG +CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA +AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC +CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC +TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT +TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG +GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC +AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT +CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA +GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA +GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG +CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG +GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT +GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC +TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115530.1 +TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC +GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG +ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC +AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG +CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT +GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG +CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG +CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC +TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT +GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA +AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA +AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG +AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT +CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA +TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA +AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT +ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT +TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT +TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG +GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT +GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA +GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA +ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA +AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC +CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG +AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA +CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG +GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT +CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT +TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT +GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT +TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC +CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT +CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT +TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA +TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA +AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA +AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT +TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA +AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT +GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA +AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA +AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA +CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT +AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA +GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA +CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA +AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA +TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG +ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC +ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT +GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG +GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC +CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA +CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT +AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT +TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA +ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC +TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG +GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG +GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC +TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT +TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT +GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT +TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT +AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA +ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA +TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT +TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA +AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC +ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC +AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG +GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT +TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA +AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG +AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA +AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC +AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA +TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA +AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA +AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA +TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA +AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC +ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG +AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA +CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT +CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC +AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC +CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG +AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT +AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG +ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC +CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT +TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC +ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC +ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA +GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG +CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC +AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG +AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG +GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA +CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC +ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA +GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA +CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA +ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT +AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA +ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA +GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC +TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG +ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA +GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT +TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA +ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG +AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT +ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA +GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA +GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT +ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA +GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA +GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA +GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA +GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT +GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA +GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC +GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG +CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG +GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG +CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT +GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG +GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC +CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT +TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA +TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA +TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA +GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA +TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG +AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA +ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT +ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA +GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG +GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC +TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC +TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA +TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA +GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA +AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG +GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC +CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC +CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC +GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG +AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT +TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC +AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT +CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT +GCCT +>MK115503.1 +GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG +AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG +CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA +ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT +AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG +ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC +AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG +CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT +AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT +AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA +CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA +AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT +AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA +ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC +TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT +TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT +ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA +AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG +CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC +ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT +CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT +AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA +AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT +GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC +ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT +GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG +ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA +AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC +AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC +AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG +CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT +TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG +GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG +ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT +TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC +AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT +CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA +GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA +TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG +ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT +GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT +AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA +CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA +AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT +ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG +AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG +AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA +GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT +AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT +AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA +TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA +GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG +AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG +CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA +AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC +CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA +CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA +AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT +CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT +AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA +TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG +GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA +GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA +GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA +AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT +TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA +TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA +GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT +GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA +GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG +GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA +TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA +CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA +TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG +AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC +AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC +TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA +GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC +CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT +ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT +TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC +TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG +AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA +AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC +AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG +TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT +GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG +GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT +TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG +GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC +ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA +TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA +TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC +CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC +ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC +AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA +GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA +GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG +GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT +ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT +AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA +AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA +CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA +CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT +ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA +AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC +CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA +ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT +GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA +CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA +TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG +TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA +TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG +CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA +ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT +TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG +CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA +ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA +TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT +TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC +ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT +TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG +CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT +GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT +CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT +TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG +TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA +GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA +GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA +TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC +TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC +AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG +TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT +GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA +AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA +GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA +TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG +TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG +ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT +TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT +GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA +GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA +AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA +GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA +GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG +GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG +GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT +ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA +GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC +TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC +CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA +GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG +CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG +ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT +CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC +AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT +GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG +TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT +CAATAAAGCTTGCCTTG +>MK115509.1 +CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT +AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC +TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT +CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC +TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA +TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC +AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG +GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA +TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA +TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG +GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT +AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA +GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA +CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG +CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG +GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA +TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA +GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG +CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC +ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT +ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG +ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC +TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT +TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA +GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA +CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA +ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC +AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT +GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA +ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA +GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG +GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC +CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG +ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG +GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC +ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC +TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG +TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA +AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA +TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA +AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG +TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG +ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT +TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC +CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC +CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG +GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT +TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA +TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG +ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA +TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA +CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT +TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC +AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA +AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG +AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA +GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT +GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG +AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA +CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA +CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG +GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC +CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA +AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA +AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG +AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC +CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA +TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG +GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC +CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG +TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT +GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG +TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG +AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG +GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA +CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA +GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG +TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG +ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA +ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT +TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA +GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG +CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC +CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT +ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT +AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA +AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG +ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA +AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT +ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC +TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA +GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT +CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT +TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA +AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT +GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA +ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA +GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG +GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT +GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA +AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA +TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT +GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA +GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG +TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG +AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA +GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA +TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT +ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG +TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC +ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA +AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT +GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC +TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC +ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT +AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA +AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT +GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT +CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT +GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT +AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT +GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG +AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT +AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT +GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT +GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA +GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT +TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG +TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT +TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA +AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT +AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT +AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT +ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA +AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT +TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT +CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA +TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT +CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG +AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT +GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG +AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG +AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC +TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA +GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC +TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC +TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG +AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG +TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC +CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC +TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT +ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG +AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115490.1 +CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG +GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC +AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA +ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG +GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA +ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA +GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA +AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA +AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA +AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT +AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA +TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC +AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA +GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC +CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA +GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA +GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT +ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA +GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA +GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA +GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT +AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA +GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG +ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA +GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC +CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG +CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA +GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG +GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG +CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA +CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA +AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG +TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA +CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG +GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG +CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA +CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT +TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA +AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC +CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA +GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT +TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG +GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA +TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG +GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA +GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG +ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT +GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT +ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT +GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG +CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG +TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG +AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC +AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG +GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG +TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC +CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC +CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG +AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT +TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA +CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG +AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA +AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT +ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG +TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC +ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG +TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG +GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG +TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG +AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA +CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT +GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG +AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC +TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG +GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG +AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG +ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC +AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG +GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG +AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA +CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT +GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG +GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC +CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA +AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG +GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA +CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG +GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG +AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA +CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT +TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG +CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT +AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC +ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT +CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG +CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT +GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG +TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG +GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG +TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC +AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT +TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA +TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT +AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC +TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT +GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA +GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG +TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT +TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA +TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG +AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT +AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA +ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG +ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG +TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA +ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT +AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA +TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT +CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC +CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG +AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA +CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC +ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC +TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT +GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG +AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA +GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG +TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA +ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA +TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA +ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA +ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT +AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT +TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG +TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG +GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT +TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG +GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT +CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG +TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA +AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA +TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC +ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG +CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA +TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG +GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG +GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT +TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA +ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA +TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT +ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA +GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC +AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT +CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115576.1 +AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT +AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG +CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG +AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC +CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA +GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT +CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG +TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA +GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG +GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT +GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA +CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC +CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA +GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC +ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT +CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC +AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA +AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC +ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA +CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG +GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA +TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT +ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA +AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA +AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG +GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT +GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC +CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC +AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC +TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA +GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT +GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC +TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC +AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT +TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC +AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG +GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA +ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC +CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA +CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC +CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG +AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG +GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC +CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA +CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA +TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG +TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA +GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA +AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT +GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA +AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT +TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG +CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT +ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT +ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG +GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA +GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG +AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA +CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA +CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA +CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT +TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT +CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA +ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC +ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG +TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT +GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA +GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG +GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG +TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT +ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA +GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT +TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA +AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG +CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA +GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA +AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG +CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG +TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG +ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT +ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT +CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA +TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA +TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT +CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA +GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG +GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA +CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA +ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA +GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG +GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT +GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT +CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC +TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC +TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT +CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA +ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA +GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA +AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG +GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG +GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC +ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT +ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT +GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG +CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA +TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG +CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA +TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA +CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA +TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG +ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC +TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT +CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC +AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC +AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG +GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT +AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG +AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG +GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT +TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT +TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA +GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA +TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG +AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG +AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT +ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA +TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA +AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG +CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA +TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC +CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA +TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT +ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT +AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC +GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG +ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG +CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT +TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT +TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA +GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC +TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA +AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG +CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA +ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG +TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG +ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA +GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA +ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG +TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA +GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC +TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT +GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG +GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG +GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC +TGCTTAAGCCTCAATAAAGCTTGCCT diff --git a/tests/expected-results-large/nonintact.fasta b/tests/expected-results-large/nonintact.fasta index 9113fa3..29434e4 100644 --- a/tests/expected-results-large/nonintact.fasta +++ b/tests/expected-results-large/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA @@ -731,166 +568,6 @@ CCGCTAGGGACTTTCCAGGGGAGGCGTGAACTGGGCGGGACAGGGGAGTGGCGAGCCCTC AGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGAT CAGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT GCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC ->MK115581.1 -AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA -ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA -TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT -AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT -GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG -AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA -GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG -CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG -ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT -TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT -CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG -AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG -TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA -AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA -TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG -CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG -CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC -ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA -GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA -GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC -CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG -TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA -GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA -AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT -TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG -GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA -ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT -GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA -AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG -GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC -CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA -AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA -GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG -AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT -AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG -TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG -AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT -ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA -AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC -AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG -TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG -GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT -ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC -TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT -GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT -AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA -TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA -TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT -TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA -AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG -TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC -ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA -AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA -AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA -TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT -AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA -ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC -CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA -ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG -AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC -CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA -TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC -ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA -GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT -AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC -CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT -ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA -GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT -AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT -TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG -GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC -CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA -AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA -GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA -AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT -ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG -GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC -AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT -TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA -TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT -GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC -CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG -AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG -TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT -CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG -GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA -GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC -AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA -ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA -TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA -ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC -ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG -GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC -AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC -GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG -TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA -TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA -GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG -AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG -TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA -TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG -GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA -GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG -CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA -CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG -GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA -AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT -GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA -AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA -AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA -TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA -GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA -CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT -ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA -CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA -AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC -CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA -CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA -AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA -GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA -CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA -GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA -TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG -GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG -TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC -AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC -AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG -GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT -TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA -GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG -GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT -AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA -GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA -CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC -GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG -GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC -TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC -AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC -TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA -CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG -GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT -AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA -CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC -CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC -TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG -GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA -CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA -TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA -AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA -AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA -GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG -GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC -TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC -CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG -CACTCAAGGCAAGCT >MK115690.1 TGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACA CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCAC @@ -1686,165 +1363,6 @@ CCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGAC CAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAA AGCTTGCCTTGCACTCAAGGCAAGCTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC TAGAGA ->MK115498.1 -AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC -TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG -GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA -CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT -CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA -ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA -GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA -GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT -CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG -GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA -ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT -AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA -GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA -GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG -GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA -GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC -ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA -ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT -GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT -ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA -GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT -ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG -TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA -ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA -GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA -GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA -GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC -ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA -CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC -CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA -GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC -AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA -TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT -TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT -TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG -GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC -TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC -CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT -TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA -ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT -TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA -TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG -CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA -GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA -AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC -AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG -AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC -TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC -TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG -TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA -TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC -CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG -TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA -ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT -ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA -AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC -AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT -GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA -TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA -AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA -ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA -ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG -AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG -CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA -CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA -AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA -AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG -TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC -TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG -GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC -ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG -GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA -TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA -CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT -ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC -AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC -TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA -ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC -AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT -TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC -TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA -TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG -GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA -GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC -ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC -TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA -CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC -AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG -TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG -GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC -ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA -ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT -CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA -AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA -GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT -CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG -ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT -GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA -TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC -TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC -CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC -CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC -AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA -TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA -TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA -AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA -ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC -ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC -AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA -GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA -GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT -TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT -ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG -AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT -TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA -TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA -TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC -TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG -CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC -CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG -TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG -GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC -CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT -CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT -ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT -TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG -AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC -TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT -GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC -AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA -ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT -GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT -TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC -CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA -AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA -CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC -AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT -CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC -CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC -TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG -GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC -GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG -CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG -AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT -TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA -TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT -TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT -GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT -TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA -AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA -AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG -GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC -GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT -AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115211.1 CTTCTAGCCTCCGCTAGTCAAAACGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAA GCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCG @@ -2777,165 +2295,6 @@ CATAGAGTTTTCCACCAGGGACTTTCCAGAAGAGGCGTGGCCTGGGCGGGACCGGGGAGT GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGT TAGACCAGATCTGAGCCTGGGAGCTCTCTGTCTAACTAGGGAACCCACTGCTTAAGCCTC AATAAAGCTTGCCTTG ->MK115491.1 -CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT -TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG -ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC -TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG -GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC -GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA -GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG -CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA -TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA -AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA -ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT -CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT -GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG -AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA -ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC -TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG -AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA -TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG -AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC -AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA -TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA -TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC -AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG -AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA -ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA -TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA -TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA -AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC -CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG -AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT -TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG -AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT -CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA -AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG -AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA -TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC -ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC -CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT -TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT -GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT -TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA -TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA -AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA -TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG -GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA -AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA -TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA -AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA -TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT -ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT -GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA -ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT -AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC -ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT -TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA -CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT -AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG -GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC -CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA -TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG -AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC -AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA -TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT -AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG -AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT -TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC -AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA -TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG -GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG -TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT -CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT -CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT -TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT -TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT -CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT -AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA -AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT -TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC -AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT -GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG -TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA -TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG -GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA -AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT -ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC -CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA -AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG -AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG -GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG -GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA -GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA -TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC -TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA -AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG -GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT -CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG -GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA -GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA -AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG -GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA -GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT -GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA -GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA -AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG -CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT -AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC -AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT -GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA -GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC -CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT -AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA -CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC -AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC -AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA -GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT -ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT -AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA -TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG -AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC -AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT -TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG -ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT -AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG -CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA -GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT -GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG -CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC -CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT -GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG -ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT -GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG -GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA -ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT -AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA -CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT -CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC -CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA -CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG -CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA -GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA -ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG -TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG -GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC -AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT -TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG -CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA -TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC -ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT -GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA -TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT -TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT -CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG -GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT -CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA -GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC -GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG -TA >MK116110.1 CCTGAAAGCGAAAGTAGAACCAGAGAAGTTCTCTCGACGCAGGACTCGGCTTGCTGAGCT TTATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCT @@ -3087,166 +2446,6 @@ CTGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCCGCTTTCGCCTGTACTGGGTC TCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTGGGGAACCCACTGCT TAAGCCTCAATAAAGCTTGCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGA CTCTGGTAGTTACCAGAGTCACACAAC ->MK115527.1 -ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC -GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA -CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT -AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG -CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA -GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA -ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC -ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT -GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT -AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA -GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC -TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT -TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC -ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA -CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG -AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC -AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA -AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC -CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA -ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT -CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG -GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG -ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG -GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA -ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA -TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT -TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG -TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA -TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG -TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG -CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA -ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT -GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT -TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG -AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC -AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG -GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC -AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT -GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT -CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG -AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC -TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC -AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT -TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA -CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT -TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC -AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA -TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA -TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT -CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT -GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA -ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT -CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC -AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC -AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA -AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG -GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC -AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA -AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA -ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC -TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA -AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA -CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA -TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT -CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA -GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA -AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA -AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA -AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA -GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA -TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG -AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA -TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA -AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG -ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA -GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG -TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA -TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG -AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA -CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA -CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG -GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT -CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA -GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG -GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA -TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA -GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC -AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG -AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG -CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA -AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC -ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA -GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA -ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT -GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT -GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC -CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT -GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC -AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA -TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA -AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA -GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG -ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT -GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA -GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA -GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG -ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC -CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT -GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA -AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT -AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT -CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT -CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA -CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA -GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA -GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA -AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA -AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT -GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG -GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA -ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT -GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA -AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG -TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA -GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG -CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA -GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA -GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA -AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC -ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC -CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT -AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA -AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG -CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG -TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG -ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT -TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA -ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC -TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA -GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC -CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT -AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA -GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA -AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC -TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG -AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG -CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT -GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA -GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT -CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG -ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA -TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA -AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA -GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG -CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA -TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG -AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC -T >MK114997.1 TGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCGGGCGCCACT GCTAAGATTAGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACT @@ -3399,166 +2598,6 @@ CTGCATCCGGAATATTTCAAGGACTGCTGACACTGAGATTTCTACAAGGGACTTTCCGCT GGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCTCAGATG CTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAG CCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT ->MK115518.1 -TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG -CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT -AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG -CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG -CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC -CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT -AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC -CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT -CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC -GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA -TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT -AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC -AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA -ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT -ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA -GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT -AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC -ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC -ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA -TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG -ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG -TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC -ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT -AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG -AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA -AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT -AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG -GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA -TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG -TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA -ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG -GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC -AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA -GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG -CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA -GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA -GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT -GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA -AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA -CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA -GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA -AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT -ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG -GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA -CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT -GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG -CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA -GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT -GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT -CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT -TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA -AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT -CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA -CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA -ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA -GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT -CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA -ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA -TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC -ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA -TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA -GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC -CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT -TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA -CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG -GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA -GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC -CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA -CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG -GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA -GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT -ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG -CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC -GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA -GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG -GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA -GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA -CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG -GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA -GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT -AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT -TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG -GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC -ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA -ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT -TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC -TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG -ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG -AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA -GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA -CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT -ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA -CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA -CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG -AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA -AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG -ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT -ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT -AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG -GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA -AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT -TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT -GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG -CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG -GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC -ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC -TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG -AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA -ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG -ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA -AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA -AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT -GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG -AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC -ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA -TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC -AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA -AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC -CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC -AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA -ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG -CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC -TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG -ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT -TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG -GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT -CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA -ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA -AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG -GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT -GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG -AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG -AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA -ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG -GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC -CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG -AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG -CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT -TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA -AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT -TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC -AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG -CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA -AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC -CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC -TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT -TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG -GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC -AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT -CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA -GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA -GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG -CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG -GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT -GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC -TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115065.1 TAGCCTCCGCTAGTCAAAAATTTCGGCGTACTCACCAGTCGCCGCGCCTCGCCTCTTGCC GTGCGCGCTCAGCAAGCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTT @@ -3877,167 +2916,6 @@ AAGAGGCGTGGCCTAGGCAGGACCGAAGAGTGGCGAGCCCTCAGATGCTGCATAAAAGCA GCTGCTTTTGCCTGTACTAGGTCTCTCTAGTTAGACCAGATCTGAGCCTAGGAGCTCTCT GTCTAACTAAGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTA GTG ->MK115530.1 -TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC -GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG -ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC -AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG -CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT -GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG -CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG -CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC -TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT -GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA -AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA -AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG -AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT -CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA -TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA -AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT -ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT -TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT -TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG -GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT -GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA -GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA -ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA -AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC -CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG -AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA -CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG -GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT -CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT -TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT -GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT -TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC -CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT -CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT -TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA -TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA -AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA -AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT -TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA -AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT -GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA -AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA -AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA -CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT -AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA -GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA -CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA -AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA -TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG -ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC -ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT -GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG -GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC -CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA -CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT -AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT -TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA -ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC -TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG -GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG -GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC -TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT -TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT -GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT -TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT -AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA -ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA -TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT -TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA -AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC -ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC -AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG -GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT -TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA -AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG -AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA -AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC -AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA -TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA -AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA -AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA -TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA -AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC -ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG -AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA -CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT -CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC -AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC -CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG -AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT -AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG -ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC -CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT -TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC -ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC -ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA -GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT -AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG -CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC -AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG -AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG -GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA -CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC -ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA -GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA -CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA -ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT -AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA -ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA -GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC -TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG -ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA -GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT -TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA -ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG -AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT -ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA -GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA -GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT -ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA -GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA -GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA -GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA -GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT -GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA -GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC -GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG -CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG -GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG -CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT -GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG -GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC -CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT -TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA -TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA -TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA -GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA -TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG -AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA -ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT -ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA -GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG -GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC -TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC -TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA -TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA -GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA -AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG -GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC -CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC -CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC -GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG -AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT -TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC -AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT -CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT -GCCT >MK115520.1 ATCTCTAGCAGAAGCGCCCGACCAGACTCTGGCGACCGGACACCGTTCATCCCTTGGAGA CCCGCCAGACTCAAGCTATTGCAGTGGCGCCCGACTCTGGAACTAGAGATCCCTCACCCT @@ -4199,168 +3077,6 @@ AGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTC TGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAG CCTCAATAAAGCTTTGCCTTCTAGATGTGTACAATCTAGTTGCCATATTCCTGGACTACA ATCTACTTGTCCATGCATGGCCTCTCCTTTTGCTGACATTTATCACAGC ->MK115503.1 -GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG -AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG -CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA -ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT -AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG -ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC -AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG -CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT -AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT -AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA -CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA -AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT -AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA -ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC -TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT -TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT -ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA -AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG -CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC -ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT -CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT -AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA -AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT -GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC -ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT -GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG -ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA -AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC -AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC -AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG -CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT -TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG -GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG -ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT -TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC -AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT -CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA -GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA -TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG -ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT -GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT -AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA -CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA -AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT -ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG -AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG -AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA -GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT -AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT -AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA -TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA -GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG -AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG -CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA -AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC -CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA -CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA -AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT -CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT -AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA -TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG -GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA -GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA -GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA -AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT -TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA -TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA -GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT -GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA -GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG -GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA -TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA -CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA -TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG -AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC -AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC -TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA -GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC -CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT -ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT -TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC -TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG -AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA -AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC -AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG -TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT -GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG -GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT -TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG -GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC -ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA -TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA -TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC -CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC -ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC -AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA -GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA -GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG -GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT -ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT -AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA -AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA -CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA -CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT -ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA -AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC -CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA -ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT -GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA -CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA -TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG -TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA -TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG -CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA -ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT -TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG -CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA -ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA -TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT -TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC -ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT -TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG -CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT -GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT -CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT -TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG -TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA -GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA -GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA -TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC -TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC -AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG -TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT -GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA -AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA -GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA -TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG -TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG -ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT -TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT -GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA -GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA -AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA -GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA -GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG -GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG -GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT -ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA -GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC -TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC -CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA -GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG -CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG -ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT -CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC -AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT -GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG -TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT -CAATAAAGCTTGCCTTG >MK115570.1 AACGTGTCGTGCCCCCAAAACATAACGTAAACGTGGAAGCGGAGAGCCTTAAGGTAACTG CGGGGCCCCAAATCCAATATCTAGGGCGCCCGAACGAGACTCTGGTAACTAGAGATCCCT @@ -4521,163 +3237,6 @@ TCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCT CAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGA TCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCT TGCCT ->MK115509.1 -CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT -AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC -TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT -CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC -TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA -TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC -AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG -GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA -TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA -TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG -GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT -AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA -GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA -CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG -CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG -GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA -TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA -GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG -CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC -ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT -ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG -ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC -TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT -TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA -GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA -CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA -ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC -AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT -GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA -ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA -GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG -GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC -CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG -ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG -GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC -ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC -TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG -TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA -AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA -TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA -AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG -TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG -ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT -TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC -CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC -CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG -GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT -TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA -TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG -ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA -TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA -CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT -TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC -AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA -AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG -AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA -GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT -GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG -AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA -CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA -CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG -GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC -CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA -AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA -AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG -AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC -CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA -TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG -GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC -CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG -TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT -GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG -TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG -AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG -GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA -CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA -GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG -TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG -ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA -ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT -TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA -GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG -CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC -CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT -ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT -AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA -AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG -ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA -AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT -ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC -TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA -GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT -CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT -TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA -AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT -GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA -ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA -GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG -GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT -GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA -AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA -TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT -GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA -GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG -TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG -AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA -GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA -TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT -ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG -TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC -ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA -AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT -GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC -TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC -ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT -AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA -AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT -GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT -CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT -GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT -AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT -GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG -AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT -AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT -GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT -GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA -GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT -TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG -TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT -TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA -AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT -AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT -AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT -ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA -AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT -TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT -CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA -TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT -CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG -AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT -GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG -AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG -AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC -TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA -GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC -TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC -TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG -AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG -TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC -CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC -TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT -ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG -AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115702.1 GAATACTGCCATTTGTACTGCTGTCTTAAGATGTTCAGCCTGATCTCTGACCTGTCCTAT TATTTTCTTTAATTCTTTATTCATAGATTCTACCACTCCTTGACTCTGGGGATTGTAGGG @@ -4985,319 +3544,6 @@ GGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTAGGTCT CTCTGGTTAGACCAGATCTGAGCCTAGGAGCTCTCTGGCTAACTAGAGAACCCACTGCTT AAGCCTCAATAAAGCTTGCCTTGAGTGCTATAAGTAGTGTGTGCCCGTCTGTTGTGTGAC TCTGGTAACTAGAGATC ->MK115490.1 -CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG -GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC -AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA -ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG -GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA -ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA -GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA -AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA -AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA -AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT -AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA -TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC -AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA -GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC -CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA -GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA -GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT -ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA -GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA -GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA -GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT -AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA -GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG -ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA -GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC -CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG -CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA -GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG -GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG -CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA -CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA -AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG -TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA -CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG -GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG -CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA -CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT -TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA -AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC -CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA -GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT -TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG -GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA -TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG -GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA -GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG -ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT -GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT -ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT -GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG -CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG -TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG -AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC -AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG -GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG -TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC -CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC -CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG -AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT -TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA -CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG -AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA -AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT -ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG -TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC -ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG -TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG -GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG -TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG -AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA -CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT -GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG -AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC -TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG -GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG -AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG -ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC -AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG -GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG -AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA -CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT -GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG -GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC -CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA -AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG -GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA -CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG -GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG -AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA -CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT -TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG -CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT -AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC -ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT -CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG -CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT -GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG -TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG -GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG -TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC -AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT -TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA -TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT -AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC -TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT -GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA -GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG -TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT -TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA -TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG -AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT -AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA -ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG -ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG -TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA -ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT -AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA -TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT -CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC -CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG -AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA -CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC -ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC -TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT -GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG -AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA -GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG -TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA -ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA -TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA -ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA -ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT -AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT -TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG -TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG -GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT -TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG -GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT -CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG -TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA -AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA -TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC -ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG -CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA -TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG -GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG -GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT -TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA -ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA -TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT -ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA -GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC -AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT -CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT ->MK115576.1 -AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT -AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG -CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG -AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC -CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA -GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT -CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG -TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA -GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG -GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT -GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA -CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC -CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA -GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC -ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT -CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC -AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA -AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC -ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA -CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG -GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA -TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT -ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA -AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA -AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG -GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT -GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC -CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC -AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC -TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA -GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT -GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC -TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC -AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT -TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC -AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG -GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA -ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC -CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA -CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC -CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG -AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG -GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC -CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA -CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA -TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG -TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA -GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA -AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT -GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA -AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT -TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG -CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT -ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT -ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG -GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA -GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG -AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA -CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA -CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA -CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT -TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT -CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA -ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC -ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG -TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT -GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA -GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG -GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG -TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT -ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA -GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT -TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA -AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG -CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA -GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA -AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG -CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG -TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG -ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT -ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT -CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA -TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA -TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT -CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA -GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG -GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA -CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA -ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA -GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG -GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT -GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT -CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC -TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC -TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT -CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA -ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA -GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA -AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG -GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG -GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC -ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT -ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT -GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG -CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA -TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG -CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA -TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA -CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA -TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG -ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC -TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT -CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC -AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC -AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG -GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT -AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG -AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG -GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT -TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT -TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA -GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA -TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG -AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG -AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT -ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA -TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA -AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG -CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA -TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC -CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA -TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT -ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT -AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC -GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG -ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG -CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT -TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT -TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA -GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC -TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA -AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG -CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA -ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG -TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG -ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA -GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA -ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG -TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA -GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC -TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT -GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG -GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG -GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC -TGCTTAAGCCTCAATAAAGCTTGCCT >OQ092466 GACGGCCGAGGTGGCTCTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGA TCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCC diff --git a/tests/expected-results-large/orfs.json b/tests/expected-results-large/orfs.json index 54fc619..9d50b56 100644 --- a/tests/expected-results-large/orfs.json +++ b/tests/expected-results-large/orfs.json @@ -4,10 +4,10 @@ "name": "env", "start": 0, "end": 1824, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.7626080297560442, + "distance": 0.7623480451210163, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -28,10 +28,10 @@ "name": "nef", "start": 0, "end": 1824, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.7645782478980201, + "distance": 0.764345579086969, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -40,8 +40,8 @@ "name": "tat_exon1", "start": 1, "end": 1750, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7680130480667754, "protein": "MRKLQNGIDCIQCMQGLLHQAR", @@ -64,8 +64,8 @@ "name": "rev_exon1", "start": 1306, "end": 1750, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.758082497212932, "protein": "MRTQIVKLF", @@ -77,9 +77,21 @@ "start": 1599, "end": 1824, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, + "orientation": "forward", + "distance": 0.763687959047407, + "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", + "aminoacids": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", + "nucleotides": "ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" + }, + { + "name": "vpu", + "start": 1599, + "end": 1824, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7638478800047243, + "distance": 0.7672672672672673, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -100,8 +112,8 @@ "name": "tat_exon2", "start": 1746, "end": 1824, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.7616257781032589, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", @@ -112,25 +124,13 @@ "name": "rev_exon2", "start": 1747, "end": 1927, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.7620186257236345, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", "nucleotides": "GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA" - }, - { - "name": "vpu", - "start": 1748, - "end": 1778, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7688723205964585, - "protein": "MHPEYYKDC", - "aminoacids": "MHPEYYKDC*", - "nucleotides": "ATGCATCCGGAGTACTACAAGGACTGCTGA" } ], "MN691959": [ @@ -175,9 +175,9 @@ "start": 5408, "end": 5699, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5391891891891883, + "distance": 0.09157509157509158, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -186,8 +186,8 @@ "name": "tat_exon1", "start": 5679, "end": 5898, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", @@ -198,44 +198,44 @@ "name": "rev_exon1", "start": 5818, "end": 5899, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5910, + "end": 6156, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.7333193453629878, + "protein": "MQPIQIAIVALVVAIIIAIVV", + "aminoacids": "MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*", + "nucleotides": "ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG" + }, { "name": "env", "start": 6070, "end": 8656, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.13638128518734216, + "distance": 0.1405525502318391, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*", "nucleotides": "ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA" }, - { - "name": "vpu", - "start": 6105, - "end": 6156, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.2321981424148607, - "protein": "MGVEMGHHAPWDIDDL", - "aminoacids": "MGVEMGHHAPWDIDDL*", - "nucleotides": "ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8237, "end": 8333, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6672629695885509, "protein": "RPTSQTRGDPTGPKE", @@ -246,8 +246,8 @@ "name": "rev_exon2", "start": 8238, "end": 8514, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.210025203024363, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", @@ -258,10 +258,10 @@ "name": "nef", "start": 8657, "end": 9278, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.08588605782994552, + "distance": 0.06582796957284964, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA" @@ -272,10 +272,10 @@ "name": "nef", "start": 0, "end": 4059, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.763072203234748, + "distance": 0.7628009106462086, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*", "nucleotides": "TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG" @@ -284,26 +284,14 @@ "name": "env", "start": 2, "end": 4115, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.7604257801108195, + "distance": 0.76033143808071, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", "nucleotides": "GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" }, - { - "name": "vpu", - "start": 2, - "end": 2084, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7659115426105717, - "protein": "MGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ", - "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*", - "nucleotides": "GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAA" - }, { "name": "gag", "start": 789, @@ -345,9 +333,21 @@ "start": 3617, "end": 4115, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, + "orientation": "forward", + "distance": 0.7629151983204618, + "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", + "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", + "nucleotides": "ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" + }, + { + "name": "vpu", + "start": 3617, + "end": 4115, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7635778016363703, + "distance": 0.7634058115037564, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", "nucleotides": "ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" @@ -356,8 +356,8 @@ "name": "tat_exon1", "start": 3823, "end": 4084, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7659115426105717, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -368,8 +368,8 @@ "name": "rev_exon1", "start": 3823, "end": 4084, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.7610789980732178, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -380,10 +380,10 @@ "name": "tat_exon2", "start": 4080, "end": 4164, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.7699443413729128, + "distance": 0.769292994661058, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", "nucleotides": "ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA" @@ -392,8 +392,8 @@ "name": "rev_exon2", "start": 4081, "end": 4153, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.7667894365645325, "protein": "YPVASPQMLHISSCFLPVLGLSG", @@ -443,9 +443,9 @@ "start": 5547, "end": 5838, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.587876570313453, + "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG" @@ -454,8 +454,8 @@ "name": "tat_exon1", "start": 5818, "end": 6037, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -466,44 +466,44 @@ "name": "rev_exon1", "start": 5957, "end": 6038, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6049, + "end": 6298, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.520618556701031, + "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", + "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", + "nucleotides": "ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6212, "end": 8783, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.47520309038232134, + "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6253, - "end": 6298, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.3649167733674775, - "protein": "MEMGHHAPWDVDDL", - "aminoacids": "MEMGHHAPWDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8364, "end": 8460, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -514,8 +514,8 @@ "name": "rev_exon2", "start": 8365, "end": 8641, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -526,10 +526,10 @@ "name": "nef", "start": 8784, "end": 9387, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4049958673891082, + "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA" @@ -577,9 +577,9 @@ "start": 4931, "end": 5222, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.6083541998634192, + "distance": 0.3808935556928146, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG" @@ -588,8 +588,8 @@ "name": "tat_exon1", "start": 5202, "end": 5421, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", @@ -600,44 +600,44 @@ "name": "rev_exon1", "start": 5341, "end": 5422, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5433, + "end": 5682, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5244381020335356, + "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", + "aminoacids": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*", + "nucleotides": "ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5596, "end": 8158, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.5139610675592354, + "distance": 0.5152420275849952, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", "aminoacids": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*", "nucleotides": "ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA" }, - { - "name": "vpu", - "start": 5643, - "end": 5682, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.5690703735881842, - "protein": "MGHDAPWDVDDL", - "aminoacids": "MGHDAPWDVDDL*", - "nucleotides": "ATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 7739, "end": 7835, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6842105263157894, "protein": "RPSSQPRGDQTGPKE", @@ -648,8 +648,8 @@ "name": "rev_exon2", "start": 7740, "end": 8016, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", @@ -660,10 +660,10 @@ "name": "nef", "start": 8159, "end": 8813, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.49485619884358334, + "distance": 0.4891015417331206, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", "aminoacids": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA" @@ -711,9 +711,9 @@ "start": 4859, "end": 5150, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.580763397371082, + "distance": 0.36116422349691957, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*", "nucleotides": "ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -722,8 +722,8 @@ "name": "tat_exon1", "start": 5130, "end": 5349, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.46628407460545196, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", @@ -734,44 +734,44 @@ "name": "rev_exon1", "start": 5269, "end": 5350, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5763097949886105, "protein": "MAGRSGDSDEELLRIAGTIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLRIAGTIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5361, + "end": 5631, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5680096940321115, + "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL", + "aminoacids": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*", + "nucleotides": "ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA" + }, { "name": "env", "start": 5524, "end": 8110, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4972760674014952, + "distance": 0.49863720871464445, "protein": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", "aminoacids": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 5568, - "end": 5631, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.6063492063492064, - "protein": "MGNHAHLDMGHHAPWDVNDL", - "aminoacids": "MGNHAHLDMGHHAPWDVNDL*", - "nucleotides": "ATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA" - }, { "name": "tat_exon2", "start": 7691, "end": 7784, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -782,8 +782,8 @@ "name": "rev_exon2", "start": 7692, "end": 7968, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -794,10 +794,10 @@ "name": "nef", "start": 8111, "end": 8735, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5093153589821267, + "distance": 0.5036770338593534, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", "aminoacids": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*", "nucleotides": "ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA" @@ -845,9 +845,9 @@ "start": 5446, "end": 5737, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -856,8 +856,8 @@ "name": "tat_exon1", "start": 5717, "end": 5936, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -868,44 +868,44 @@ "name": "rev_exon1", "start": 5856, "end": 5937, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5948, + "end": 6194, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6111, "end": 8652, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6149, - "end": 6194, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8233, "end": 8329, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -916,8 +916,8 @@ "name": "rev_exon2", "start": 8234, "end": 8510, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -928,10 +928,10 @@ "name": "nef", "start": 8653, "end": 9268, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -979,9 +979,9 @@ "start": 5552, "end": 5843, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5980919765166341, + "distance": 0.37688442211055273, "protein": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS", "aminoacids": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAA" @@ -990,8 +990,8 @@ "name": "tat_exon1", "start": 5823, "end": 6042, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", @@ -1002,46 +1002,46 @@ "name": "rev_exon1", "start": 5962, "end": 6043, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDNDEDLLKTVRFIKLLYQSSK", "aminoacids": "MAGRSGDNDEDLLKTVRFIKLLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6054, + "end": 6300, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.48542752364408415, + "protein": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL", + "aminoacids": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*", + "nucleotides": "ATGCAATCTTTAGCAATATTAGCAATAGTAGCATTAGTAGTAGCAGCCATAATAGCAATAGTTGTGTGGACCATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGATAGTGGCAATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6217, "end": 8800, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4988789237668163, + "distance": 0.49751604598034604, "protein": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ", "aminoacids": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*", "nucleotides": "ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA" }, - { - "name": "vpu", - "start": 6255, - "end": 6300, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.3649167733674775, - "protein": "MEMGHHAPWDVDDL", - "aminoacids": "MEMGHHAPWDVDDL*", - "nucleotides": "ATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8381, "end": 8474, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.5303030303030303, + "distance": 0.4918032786885247, "protein": "RPTSQPRGDPTGPKEPETKVESKTETDPLT", "aminoacids": "RPTSQPRGDPTGPKEPETKVESKTETDPLT*", "nucleotides": "AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAG" @@ -1050,8 +1050,8 @@ "name": "rev_exon2", "start": 8382, "end": 8658, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.42982806877249113, "protein": "DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE", @@ -1062,10 +1062,10 @@ "name": "nef", "start": 8801, "end": 9425, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.46635769262600346, + "distance": 0.459649710885779, "protein": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN", "aminoacids": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*", "nucleotides": "ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA" @@ -1113,9 +1113,9 @@ "start": 5345, "end": 5636, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1124,8 +1124,8 @@ "name": "tat_exon1", "start": 5616, "end": 5835, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1136,44 +1136,44 @@ "name": "rev_exon1", "start": 5755, "end": 5836, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5847, + "end": 6093, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6010, "end": 8551, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4569687738004571, + "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6048, - "end": 6093, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8132, "end": 8228, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1184,8 +1184,8 @@ "name": "rev_exon2", "start": 8133, "end": 8409, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1196,10 +1196,10 @@ "name": "nef", "start": 8552, "end": 9167, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4756067663643049, + "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -1247,9 +1247,9 @@ "start": 5350, "end": 5641, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1258,8 +1258,8 @@ "name": "tat_exon1", "start": 5621, "end": 5840, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1270,44 +1270,44 @@ "name": "rev_exon1", "start": 5760, "end": 5841, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5852, + "end": 6098, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6015, "end": 8556, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4585964351370794, + "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6053, - "end": 6098, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8137, "end": 8233, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1318,8 +1318,8 @@ "name": "rev_exon2", "start": 8138, "end": 8414, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1330,10 +1330,10 @@ "name": "nef", "start": 8557, "end": 9172, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4756067663643049, + "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -1381,9 +1381,9 @@ "start": 5473, "end": 5764, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1392,8 +1392,8 @@ "name": "tat_exon1", "start": 5744, "end": 5963, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1404,44 +1404,44 @@ "name": "rev_exon1", "start": 5883, "end": 5964, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5975, + "end": 6221, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6138, "end": 8679, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4585964351370794, + "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6176, - "end": 6221, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8260, "end": 8356, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1452,8 +1452,8 @@ "name": "rev_exon2", "start": 8261, "end": 8537, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1464,10 +1464,10 @@ "name": "nef", "start": 8680, "end": 9295, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4756067663643049, + "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -1515,9 +1515,9 @@ "start": 4951, "end": 5242, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.594871162618666, + "distance": 0.3566796368352788, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*", "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1526,8 +1526,8 @@ "name": "tat_exon1", "start": 5222, "end": 5441, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -1538,44 +1538,44 @@ "name": "rev_exon1", "start": 5361, "end": 5442, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" }, + { + "name": "vpu", + "start": 5453, + "end": 5699, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5682727709300466, + "protein": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM", + "aminoacids": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*", + "nucleotides": "ATGCATATCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" + }, { "name": "env", "start": 5616, "end": 8217, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.510440428145289, + "distance": 0.5091484869809996, "protein": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*", "nucleotides": "ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 5660, - "end": 5699, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.6901936289818864, - "protein": "MGHLVPWDGDDM", - "aminoacids": "MGHLVPWDGDDM*", - "nucleotides": "ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" - }, { "name": "tat_exon2", "start": 7798, "end": 7891, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -1586,8 +1586,8 @@ "name": "rev_exon2", "start": 7799, "end": 8075, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -1598,10 +1598,10 @@ "name": "nef", "start": 8218, "end": 8860, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5478186258332784, + "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*", "nucleotides": "ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA" @@ -1649,9 +1649,9 @@ "start": 5429, "end": 5720, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1660,8 +1660,8 @@ "name": "tat_exon1", "start": 5700, "end": 5919, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1672,44 +1672,44 @@ "name": "rev_exon1", "start": 5839, "end": 5920, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5931, + "end": 6177, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6094, "end": 8635, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6132, - "end": 6177, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8216, "end": 8312, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1720,8 +1720,8 @@ "name": "rev_exon2", "start": 8217, "end": 8493, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1732,10 +1732,10 @@ "name": "nef", "start": 8636, "end": 9251, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -1783,9 +1783,9 @@ "start": 5022, "end": 5313, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5885636318531382, + "distance": 0.3808935556928146, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*", "nucleotides": "ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -1794,8 +1794,8 @@ "name": "tat_exon1", "start": 5293, "end": 5512, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", @@ -1806,44 +1806,44 @@ "name": "rev_exon1", "start": 5432, "end": 5513, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELLRITRTIKFLYQNSE", "aminoacids": "MAGRSGDSDEELLRITRTIKFLYQNSE", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG" }, + { + "name": "vpu", + "start": 5524, + "end": 5794, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5776066350710902, + "protein": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL", + "aminoacids": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*", + "nucleotides": "ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTATTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA" + }, { "name": "env", "start": 5687, "end": 8198, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.6631820277358986, + "distance": 0.6638103647692366, "protein": "MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", "aminoacids": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 5731, - "end": 5794, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.6405797101449275, - "protein": "MGNHAHLGMGHHAPWEVNDL", - "aminoacids": "MGNHAHLGMGHHAPWEVNDL*", - "nucleotides": "ATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA" - }, { "name": "tat_exon2", "start": 7779, "end": 7872, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -1854,8 +1854,8 @@ "name": "rev_exon2", "start": 7780, "end": 8056, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -1866,10 +1866,10 @@ "name": "nef", "start": 8199, "end": 8823, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5148270181219111, + "distance": 0.5093153589821267, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC", "aminoacids": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*", "nucleotides": "ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA" @@ -2051,9 +2051,9 @@ "start": 5313, "end": 5598, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5871212121212123, + "distance": 0.39401343921808174, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS", "aminoacids": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*", "nucleotides": "ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAG" @@ -2062,8 +2062,8 @@ "name": "tat_exon1", "start": 5578, "end": 5797, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5138258357408172, "protein": "MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ", @@ -2074,44 +2074,44 @@ "name": "rev_exon1", "start": 5717, "end": 5798, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5940834141610087, "protein": "MAGRSGDRDEDLLETVRFIKFLYQNSK", "aminoacids": "MAGRSGDRDEDLLETVRFIKFLYQNSK", "nucleotides": "ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG" }, + { + "name": "vpu", + "start": 5809, + "end": 6055, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5727186311787074, + "protein": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL", + "aminoacids": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*", + "nucleotides": "ATGCAACCTTTAGAGATATCAGCAATAGTAGCATTAGTAGTAGTAGCAATAATAGCAATAGTTGTGTGGACCATAGTACTCTTAGAGTATAGGAAAATATTAAGGCAAAAGAAAATAGACAGATTAATTAATAGAATAAGTGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5972, "end": 8549, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.49969138043715056, + "distance": 0.5021538905210794, "protein": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL", "aminoacids": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*", "nucleotides": "ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6010, - "end": 6055, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.5970755483346872, - "protein": "MEMGRLAPWNVDDL", - "aminoacids": "MEMGRLAPWNVDDL*", - "nucleotides": "ATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8130, "end": 8226, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6074396517609815, "protein": "RPPAQPQGDPTGPKKSKKEVEKETETDQCD", @@ -2122,8 +2122,8 @@ "name": "rev_exon2", "start": 8131, "end": 8407, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.47688921496698455, "protein": "DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE", @@ -2134,10 +2134,10 @@ "name": "nef", "start": 8550, "end": 8985, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.6054615099468668, + "distance": 0.6017710152157637, "protein": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK", "aminoacids": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*", "nucleotides": "ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAG" @@ -2185,9 +2185,9 @@ "start": 5033, "end": 5579, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.7661862444925697, + "distance": 0.7334692430420138, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", "aminoacids": "MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*", "nucleotides": "ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAG" @@ -2196,44 +2196,44 @@ "name": "tat_exon1", "start": 5486, "end": 5780, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7619181418001311, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN", "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT" }, - { - "name": "vpu", - "start": 5486, - "end": 6206, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7713277742142399, - "protein": "MRYLCKEMQIPLYSVHQMLKHMIQKYIMFRPHMPVYPQTLTHMK", - "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVNNTCNATFKDISNSSISSSSNNSNSCVDHSRHKI*ENIKTKKNR*NN**NKKKSRRQWQ*ERKRSGRIVSTCSRNKARCSLRC**SVVLRKICKSQSIMRYLCKEMQIPLYSVHQMLKHMIQKYIMFRPHMPVYPQTLTHMK*", - "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAATAATACATGTAATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAG" - }, { "name": "rev_exon1", "start": 5698, "end": 5779, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAA" }, + { + "name": "vpu", + "start": 5790, + "end": 6039, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.7407973896196594, + "protein": "MQPLKILAIVALVVAAIIAIVV", + "aminoacids": "MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*", + "nucleotides": "ATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5953, "end": 8521, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", "distance": 0.7529994904340572, "protein": "MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD", @@ -2244,8 +2244,8 @@ "name": "nef", "start": 7916, "end": 9176, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", "distance": 0.7587548638132295, "protein": "MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", @@ -2256,8 +2256,8 @@ "name": "tat_exon2", "start": 8102, "end": 8198, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.7134052388289676, "protein": "RPSSQPQEDQTGPKE", @@ -2268,8 +2268,8 @@ "name": "rev_exon2", "start": 8103, "end": 8379, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.6888374145157732, "protein": "ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE", @@ -2317,21 +2317,21 @@ { "name": "vpr", "start": 5087, - "end": 5249, + "end": 5378, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.6703246973639554, + "distance": 0.6737199868435482, "protein": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT", - "aminoacids": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*", - "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAG" + "aminoacids": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*", + "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG" }, { "name": "tat_exon1", "start": 5235, "end": 5577, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.6325105553751218, "protein": "MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", @@ -2342,8 +2342,8 @@ "name": "rev_exon1", "start": 5497, "end": 5578, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSRDSDEELLTAVRIIKRLYQSSK", @@ -2354,10 +2354,10 @@ "name": "vpu", "start": 5589, "end": 5835, - "subtype_start": 6259, - "subtype_end": 6310, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7710195148641255, + "distance": 0.6256860592755216, "protein": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP", "aminoacids": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*", "nucleotides": "ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG" @@ -2366,8 +2366,8 @@ "name": "env", "start": 5752, "end": 8353, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", "distance": 0.7518870380010406, "protein": "MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD", @@ -2378,10 +2378,10 @@ "name": "nef", "start": 7748, "end": 8996, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.7344808947652905, + "distance": 0.7328145265888457, "protein": "MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR", "aminoacids": "MNKTYWH*ISRQVCKISLTLHSSYSI*KYS****EA**V*E*FLLYCL**IKLGKDTHHCHCRPSSQPREDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*KTYS*LRREL*NF*DAESKKH*SISRISCSIRVRK*RIVQLACSTPQQ*Q*LRGQIKL*KYYKEALELFSTYLHE*DRA*KRLCYKIGNKLSRRLKARWPAIKEKIRRARPVREPEPATAKVRAASRDLKRHGALTSSNTAATNADVACLEAQQKKEEVSFPVRPQVPLRPMTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*", "nucleotides": "ATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAAGGCTAGATGGCCTGCCATAAAGGAGAAAATAAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAACAGCTAAGGTAAGAGCAGCATCTCGAGACCTGAAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGAAGAAAGAAGAGGTAAGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA" @@ -2390,8 +2390,8 @@ "name": "tat_exon2", "start": 7934, "end": 8027, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.5633802816901408, "protein": "RPSSQPREDPTGPKEQKKEVERKTEAHPRD", @@ -2402,8 +2402,8 @@ "name": "rev_exon2", "start": 7935, "end": 8211, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.6781884553958476, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE", @@ -2453,9 +2453,9 @@ "start": 5061, "end": 5352, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5625083211290105, + "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -2464,8 +2464,8 @@ "name": "tat_exon1", "start": 5332, "end": 5551, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ", @@ -2476,44 +2476,44 @@ "name": "rev_exon1", "start": 5471, "end": 5552, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG" }, + { + "name": "vpu", + "start": 5563, + "end": 5809, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5560235888795282, + "protein": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL", + "aminoacids": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*", + "nucleotides": "ATGCAATCCTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTGGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAGGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG" + }, { "name": "env", "start": 5726, "end": 8288, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.52645935624659, + "distance": 0.5276672448389619, "protein": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL", "aminoacids": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 5770, - "end": 5809, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.5690703735881842, - "protein": "MGHHAPWNVDDL", - "aminoacids": "MGHHAPWNVDDL*", - "nucleotides": "ATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG" - }, { "name": "tat_exon2", "start": 7869, "end": 7965, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQLRGEPTGPKE", @@ -2524,8 +2524,8 @@ "name": "rev_exon2", "start": 7870, "end": 8146, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.32366339007432277, "protein": "DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE", @@ -2536,10 +2536,10 @@ "name": "nef", "start": 8289, "end": 8940, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.46946145391741245, + "distance": 0.4631394979345408, "protein": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", "aminoacids": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA" @@ -2587,9 +2587,9 @@ "start": 5287, "end": 5578, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -2598,8 +2598,8 @@ "name": "tat_exon1", "start": 5558, "end": 5777, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2610,44 +2610,44 @@ "name": "rev_exon1", "start": 5697, "end": 5778, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5789, + "end": 6035, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5952, "end": 8493, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 5990, - "end": 6035, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8074, "end": 8170, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2658,8 +2658,8 @@ "name": "rev_exon2", "start": 8075, "end": 8351, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2670,10 +2670,10 @@ "name": "nef", "start": 8494, "end": 9109, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -2855,9 +2855,9 @@ "start": 5449, "end": 5740, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -2866,8 +2866,8 @@ "name": "tat_exon1", "start": 5720, "end": 5939, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2878,44 +2878,44 @@ "name": "rev_exon1", "start": 5859, "end": 5940, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5951, + "end": 6197, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6114, "end": 8655, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6152, - "end": 6197, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8236, "end": 8332, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2926,8 +2926,8 @@ "name": "rev_exon2", "start": 8237, "end": 8513, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2938,10 +2938,10 @@ "name": "nef", "start": 8656, "end": 9271, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -2988,10 +2988,10 @@ "name": "env", "start": 4985, "end": 8207, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.6663239775063792, + "distance": 0.6657028690558922, "protein": "MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*LRALETSRKSTYDCL*QLLL*TVLLSLPSLLHHKRLRHLLWQEEAETATKSFSQQSESSSGSTRAVSITCNACLKNSSNSRISSSNNNSNSCVVYSINRI*ENFKTKENRQVN**NKRKSRRQWQ*K*RRPGGIISTCGDGASCSLGW**YVVPTTCGSQSIMGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*", "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAGTATTACATGTAATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" @@ -3001,9 +3001,9 @@ "start": 4985, "end": 5276, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5793112277557293, + "distance": 0.3120665742024965, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*", "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3012,8 +3012,8 @@ "name": "tat_exon1", "start": 5256, "end": 5475, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -3024,8 +3024,8 @@ "name": "rev_exon1", "start": 5395, "end": 5476, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", @@ -3034,22 +3034,22 @@ }, { "name": "vpu", - "start": 5694, + "start": 5487, "end": 5733, - "subtype_start": 6259, - "subtype_end": 6310, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.6901936289818864, - "protein": "MGHLVPWDGDDM", - "aminoacids": "MGHLVPWDGDDM*", - "nucleotides": "ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" + "distance": 0.5568484042553192, + "protein": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", + "aminoacids": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*", + "nucleotides": "ATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" }, { "name": "tat_exon2", "start": 7788, "end": 7881, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3060,8 +3060,8 @@ "name": "rev_exon2", "start": 7789, "end": 8065, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3072,10 +3072,10 @@ "name": "nef", "start": 8208, "end": 8850, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5478186258332784, + "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC", "aminoacids": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*", "nucleotides": "ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGA" @@ -3123,9 +3123,9 @@ "start": 5505, "end": 5796, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3134,8 +3134,8 @@ "name": "tat_exon1", "start": 5776, "end": 5995, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3146,44 +3146,44 @@ "name": "rev_exon1", "start": 5915, "end": 5996, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6007, + "end": 6253, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6170, "end": 8711, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.45675101255163, + "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6208, - "end": 6253, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8292, "end": 8388, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3194,8 +3194,8 @@ "name": "rev_exon2", "start": 8293, "end": 8569, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3206,10 +3206,10 @@ "name": "nef", "start": 8712, "end": 9327, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -3257,9 +3257,9 @@ "start": 4996, "end": 5287, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872377841979652, + "distance": 0.3351206434316354, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*", "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3268,8 +3268,8 @@ "name": "tat_exon1", "start": 5267, "end": 5486, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -3280,44 +3280,44 @@ "name": "rev_exon1", "start": 5406, "end": 5487, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" }, + { + "name": "vpu", + "start": 5498, + "end": 5744, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5568484042553192, + "protein": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", + "aminoacids": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*", + "nucleotides": "ATGCATGCCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" + }, { "name": "env", "start": 5661, "end": 8262, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.5065440396179699, + "distance": 0.5052314240113498, "protein": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*", "nucleotides": "ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 5705, - "end": 5744, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.6901936289818864, - "protein": "MGHLVPWDGDDM", - "aminoacids": "MGHLVPWDGDDM*", - "nucleotides": "ATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG" - }, { "name": "tat_exon2", "start": 7843, "end": 7936, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3328,8 +3328,8 @@ "name": "rev_exon2", "start": 7844, "end": 8120, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3340,10 +3340,10 @@ "name": "nef", "start": 8263, "end": 8905, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5386842636859471, + "distance": 0.5339772804571117, "protein": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*", "nucleotides": "ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA" @@ -3391,9 +3391,9 @@ "start": 5563, "end": 5854, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5898566703417862, + "distance": 0.37688442211055273, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", "aminoacids": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG" @@ -3402,8 +3402,8 @@ "name": "tat_exon1", "start": 5563, "end": 6052, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7571801566579635, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", @@ -3414,46 +3414,46 @@ "name": "rev_exon1", "start": 5973, "end": 6054, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG" }, + { + "name": "vpu", + "start": 6065, + "end": 6311, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.7521692502681095, + "protein": "MQSLYILTIVALVVAAILAIVV", + "aminoacids": "MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*", + "nucleotides": "ATGCAATCTTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTAGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAAGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAG" + }, { "name": "env", "start": 6228, "end": 8799, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", "distance": 0.7471048806788873, "protein": "MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST", "aminoacids": "MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*", "nucleotides": "ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6228, - "end": 6276, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7611885546588408, - "protein": "MRVKEIKRSYQHL", - "aminoacids": "MRVKEIKRSYQHL*R*", - "nucleotides": "ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAG" - }, { "name": "nef", "start": 8194, "end": 9451, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.6542937183493158, + "distance": 0.6514772974147296, "protein": "MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", "aminoacids": "MNKNYWH*INRQVCRISLTYHNGCGI*KYS****EA**V*E*FLLYFL**IKLGKDTHHYHFRPSSQPREEPTGPKE*KKEVERETKADPVD**TDS*HLSRTIYGAYASSATTA*ATYS*L*SRLWNF*DARGKKPSNISRISCSTRVRN*RIVLSACSTPQL***LKGQIR**KYYKELVELFSTYLGE*DRA*KRLCYKIGGKWSKSSKVK*NAVKERIRRAQPTADKERAEPAADKVRAASRDLEKYGALTSKNTAATNADCAWLEAQEEEDEVGFPVRPQLPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*", "nucleotides": "ATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAGTAAGGTTAAATAGAATGCAGTGAAAGAAAGAATAAGACGAGCTCAGCCAACAGCAGATAAAGAACGAGCTGAGCCAGCAGCAGATAAGGTAAGAGCAGCATCTAGAGACCTAGAAAAATATGGAGCACTTACAAGTAAGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGATGAGGTAGGTTTTCCAGTCAGACCTCAGTTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA" @@ -3462,8 +3462,8 @@ "name": "tat_exon2", "start": 8380, "end": 8476, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQPREEPTGPKE", @@ -3474,8 +3474,8 @@ "name": "rev_exon2", "start": 8381, "end": 8657, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.5716671727907683, "protein": "RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE", @@ -3525,9 +3525,9 @@ "start": 5512, "end": 5803, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3536,8 +3536,8 @@ "name": "tat_exon1", "start": 5783, "end": 6002, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3548,44 +3548,44 @@ "name": "rev_exon1", "start": 5922, "end": 6003, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6014, + "end": 6260, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6177, "end": 8718, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4585964351370794, + "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6215, - "end": 6260, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8299, "end": 8395, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3596,8 +3596,8 @@ "name": "rev_exon2", "start": 8300, "end": 8576, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3608,10 +3608,10 @@ "name": "nef", "start": 8719, "end": 9334, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -3659,9 +3659,9 @@ "start": 5466, "end": 5757, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3670,8 +3670,8 @@ "name": "tat_exon1", "start": 5737, "end": 5956, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3682,44 +3682,44 @@ "name": "rev_exon1", "start": 5876, "end": 5957, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5968, + "end": 6214, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6131, "end": 8672, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4569687738004571, + "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6169, - "end": 6214, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8253, "end": 8349, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3730,8 +3730,8 @@ "name": "rev_exon2", "start": 8254, "end": 8530, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3742,10 +3742,10 @@ "name": "nef", "start": 8673, "end": 9288, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4756067663643049, + "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -3793,9 +3793,9 @@ "start": 5583, "end": 5874, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3804,8 +3804,8 @@ "name": "tat_exon1", "start": 5854, "end": 6073, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3816,44 +3816,44 @@ "name": "rev_exon1", "start": 5993, "end": 6074, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6085, + "end": 6331, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6248, "end": 8789, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6286, - "end": 6331, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8370, "end": 8466, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3864,8 +3864,8 @@ "name": "rev_exon2", "start": 8371, "end": 8647, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3876,10 +3876,10 @@ "name": "nef", "start": 8790, "end": 9405, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -3927,9 +3927,9 @@ "start": 5453, "end": 5744, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -3938,8 +3938,8 @@ "name": "tat_exon1", "start": 5724, "end": 5943, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3950,44 +3950,44 @@ "name": "rev_exon1", "start": 5863, "end": 5944, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5955, + "end": 6201, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6118, "end": 8659, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4604674291397314, + "distance": 0.4620723847297967, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6156, - "end": 6201, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8240, "end": 8336, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3998,8 +3998,8 @@ "name": "rev_exon2", "start": 8241, "end": 8517, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4010,10 +4010,10 @@ "name": "nef", "start": 8660, "end": 9275, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -4061,9 +4061,9 @@ "start": 5321, "end": 5612, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -4072,8 +4072,8 @@ "name": "tat_exon1", "start": 5592, "end": 5811, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -4084,44 +4084,44 @@ "name": "rev_exon1", "start": 5731, "end": 5812, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5823, + "end": 6069, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5986, "end": 8527, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4564898680537425, + "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6024, - "end": 6069, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8108, "end": 8204, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4132,8 +4132,8 @@ "name": "rev_exon2", "start": 8109, "end": 8385, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4144,10 +4144,10 @@ "name": "nef", "start": 8528, "end": 9143, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -4195,9 +4195,9 @@ "start": 5048, "end": 5339, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5731147540983608, + "distance": 0.3566796368352788, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAA" @@ -4206,8 +4206,8 @@ "name": "tat_exon1", "start": 5319, "end": 5538, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5237430167597767, "protein": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", @@ -4218,46 +4218,46 @@ "name": "rev_exon1", "start": 5458, "end": 5539, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5622384937238494, "protein": "MAGRSGDGDEDLLKAVRLIKTLYQSSK", "aminoacids": "MAGRSGDGDEDLLKAVRLIKTLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5550, + "end": 5808, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.6039004707464695, + "protein": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND", + "aminoacids": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**", + "nucleotides": "ATGTTATCTTTAGAAGTAATAGTAGCAATAACAGCATTAGTAGTAGCAGGAATAATAGCAATAGTTGTGTGGACCATAGTACTTATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAAGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA" + }, { "name": "env", "start": 5716, "end": 8257, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.5208458282639616, + "distance": 0.5196110433453024, "protein": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE", "aminoacids": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*", "nucleotides": "ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA" }, - { - "name": "vpu", - "start": 5760, - "end": 5808, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.70010183299389, - "protein": "MGHNAHHAPWDIND", - "aminoacids": "MGHNAHHAPWDIND**", - "nucleotides": "ATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA" - }, { "name": "tat_exon2", "start": 7874, "end": 7970, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.3921568627450981, + "distance": 0.32608695652173914, "protein": "RPASQSRGDPTGPKEPKKKVERETETDPTD", "aminoacids": "RPASQSRGDPTGPKEPKKKVERETETDPTD**", "nucleotides": "AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA" @@ -4266,8 +4266,8 @@ "name": "rev_exon2", "start": 7875, "end": 8151, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE", @@ -4278,10 +4278,10 @@ "name": "nef", "start": 8275, "end": 8896, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.47444962236863253, + "distance": 0.4680383864671438, "protein": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC", "aminoacids": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA" @@ -4329,9 +4329,9 @@ "start": 4963, "end": 5254, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.6112852664576804, + "distance": 0.4464285714285715, "protein": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS", "aminoacids": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*", "nucleotides": "ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAA" @@ -4340,8 +4340,8 @@ "name": "tat_exon1", "start": 5111, "end": 5453, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.6409453748630458, "protein": "MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ", @@ -4352,8 +4352,8 @@ "name": "rev_exon1", "start": 5373, "end": 5454, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", @@ -4364,10 +4364,10 @@ "name": "vpu", "start": 5465, "end": 5711, - "subtype_start": 6259, - "subtype_end": 6310, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7683007254341614, + "distance": 0.7521692502681095, "protein": "MHALEIAAIVRLVVAAIIAIVV", "aminoacids": "MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*", "nucleotides": "ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG" @@ -4376,8 +4376,8 @@ "name": "env", "start": 5628, "end": 8229, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", "distance": 0.7513561129398668, "protein": "MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD", @@ -4388,10 +4388,10 @@ "name": "nef", "start": 7624, "end": 8872, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5872017754762344, + "distance": 0.5833488893037148, "protein": "MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MNKTY*H*ISRQVCRISLTLHSGYSI*KYS****EA**V*E*FLLYCL**IELGRDTHHCHCRPSSQPRGDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*ETYS*LWRGL*NF*DAESKKH*SIGRISCSIRVRK*RIVQLACSTPQQ*Q*LKGQIRL*KYYKEALELFSTYLHE*DRA*KKLCYKIGNKLSRRLRARWPAIKERMRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*", "nucleotides": "ATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAGGGCTAGATGGCCTGCCATAAAAGAAAGAATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA" @@ -4400,8 +4400,8 @@ "name": "tat_exon2", "start": 7810, "end": 7903, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RPSSQPRGDPTGPKEQKKEVERKTEAHPRD", @@ -4412,8 +4412,8 @@ "name": "rev_exon2", "start": 7811, "end": 8087, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.6667847862036381, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE", @@ -4463,9 +4463,9 @@ "start": 5315, "end": 5606, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -4474,8 +4474,8 @@ "name": "tat_exon1", "start": 5586, "end": 5805, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -4486,44 +4486,44 @@ "name": "rev_exon1", "start": 5725, "end": 5806, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5817, + "end": 6063, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5278361344537815, + "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5980, "end": 8521, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4585964351370794, + "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 6018, - "end": 6063, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8102, "end": 8198, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4534,8 +4534,8 @@ "name": "rev_exon2", "start": 8103, "end": 8379, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4546,10 +4546,10 @@ "name": "nef", "start": 8522, "end": 9137, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -4597,9 +4597,9 @@ "start": 5234, "end": 5525, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5872120921305184, + "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*", "nucleotides": "ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -4608,8 +4608,8 @@ "name": "tat_exon1", "start": 5505, "end": 5724, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -4620,44 +4620,44 @@ "name": "rev_exon1", "start": 5644, "end": 5725, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5736, + "end": 5982, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5399181166837258, + "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", + "aminoacids": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", + "nucleotides": "ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5899, "end": 8440, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.45675101255163, + "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA" }, - { - "name": "vpu", - "start": 5937, - "end": 5982, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.46723952738990326, - "protein": "MEMGHHAPGDVDDL", - "aminoacids": "MEMGHHAPGDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8021, "end": 8117, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4668,8 +4668,8 @@ "name": "rev_exon2", "start": 8022, "end": 8298, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4680,10 +4680,10 @@ "name": "nef", "start": 8441, "end": 9056, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4690990320178705, + "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA" @@ -4731,9 +4731,9 @@ "start": 5627, "end": 5918, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5625083211290103, + "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -4742,8 +4742,8 @@ "name": "tat_exon1", "start": 5898, "end": 6117, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", @@ -4754,8 +4754,8 @@ "name": "rev_exon1", "start": 6037, "end": 6118, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDDELLKTVRLIKVLYQSSK", @@ -4766,10 +4766,10 @@ "name": "vpu", "start": 6129, "end": 6375, - "subtype_start": 6259, - "subtype_end": 6310, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7548091006737623, + "distance": 0.5077548005908421, "protein": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL", "aminoacids": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*", "nucleotides": "ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA" @@ -4778,10 +4778,10 @@ "name": "env", "start": 6292, "end": 8875, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4841544358231281, + "distance": 0.48559709145147756, "protein": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL", "aminoacids": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*", "nucleotides": "ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA" @@ -4790,8 +4790,8 @@ "name": "tat_exon2", "start": 8456, "end": 8552, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RSTPQLRGDPTGPKESKEKVERETETDPVH", @@ -4802,8 +4802,8 @@ "name": "rev_exon2", "start": 8457, "end": 8733, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.3690449563855961, "protein": "DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE", @@ -4814,10 +4814,10 @@ "name": "nef", "start": 8876, "end": 9509, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4195274186357557, + "distance": 0.411658382286489, "protein": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC", "aminoacids": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*", "nucleotides": "ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA" @@ -5133,9 +5133,9 @@ "start": 5536, "end": 5827, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5656050955414005, + "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS", "aminoacids": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAG" @@ -5144,8 +5144,8 @@ "name": "tat_exon1", "start": 5807, "end": 6026, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ", @@ -5156,8 +5156,8 @@ "name": "rev_exon1", "start": 5946, "end": 6027, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKFLYQSSK", @@ -5168,10 +5168,10 @@ "name": "vpu", "start": 6038, "end": 6284, - "subtype_start": 6259, - "subtype_end": 6310, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7548091006737623, + "distance": 0.5464940306036659, "protein": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL", "aminoacids": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*", "nucleotides": "ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG" @@ -5180,10 +5180,10 @@ "name": "env", "start": 6201, "end": 8778, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.5096088152339575, + "distance": 0.5083167934238491, "protein": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL", "aminoacids": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" @@ -5192,10 +5192,10 @@ "name": "tat_exon2", "start": 8359, "end": 8455, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.4542873367404884, + "distance": 0.4034761018001243, "protein": "RPASQPRGDPTGPKEPTKKVERETETDPDH", "aminoacids": "RPASQPRGDPTGPKEPTKKVERETETDPDH**", "nucleotides": "AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA" @@ -5204,8 +5204,8 @@ "name": "rev_exon2", "start": 8360, "end": 8636, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE", @@ -5216,10 +5216,10 @@ "name": "nef", "start": 8779, "end": 9406, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.5105263157894737, + "distance": 0.5049429657794677, "protein": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC", "aminoacids": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*", "nucleotides": "ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA" @@ -5401,9 +5401,9 @@ "start": 5574, "end": 5865, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5793112277557293, + "distance": 0.3120665742024965, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAG" @@ -5412,8 +5412,8 @@ "name": "tat_exon1", "start": 5845, "end": 6064, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ", @@ -5424,44 +5424,44 @@ "name": "rev_exon1", "start": 5984, "end": 6065, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", "aminoacids": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6076, + "end": 6340, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.4955621301775147, + "protein": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL", + "aminoacids": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*", + "nucleotides": "ATGCAACCCTTAGTAATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAGAAAGATAGATAGCATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6239, "end": 8807, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.4718646278993922, + "distance": 0.4703403690377699, "protein": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL", "aminoacids": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*", "nucleotides": "ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6283, - "end": 6340, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.4380664652567977, - "protein": "MGHHVEMGHHAPWNVDDL", - "aminoacids": "MGHHVEMGHHAPWNVDDL*", - "nucleotides": "ATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8388, "end": 8484, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPASQLRGDQTGPKEQKKKVERETETDPGN", @@ -5472,8 +5472,8 @@ "name": "rev_exon2", "start": 8389, "end": 8674, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.4123815285339786, "protein": "DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC", @@ -5484,10 +5484,10 @@ "name": "nef", "start": 8808, "end": 9417, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.49080954243253805, + "distance": 0.484764542936288, "protein": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC", "aminoacids": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA" diff --git a/tests/expected-results-single-csv/blast.csv b/tests/expected-results-single-csv/blast.csv index 6830cf2..cd13240 100644 --- a/tests/expected-results-single-csv/blast.csv +++ b/tests/expected-results-single-csv/blast.csv @@ -1,4 +1,4 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 diff --git a/tests/expected-results-single-csv/errors.csv b/tests/expected-results-single-csv/errors.csv index 8a1c252..1378841 100644 --- a/tests/expected-results-single-csv/errors.csv +++ b/tests/expected-results-single-csv/errors.csv @@ -1,3 +1 @@ sequence_name,error,message -MN692145,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN692145,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" diff --git a/tests/expected-results-single-csv/holistic.csv b/tests/expected-results-single-csv/holistic.csv index d3d8de7..57ad129 100644 --- a/tests/expected-results-single-csv/holistic.csv +++ b/tests/expected-results-single-csv/holistic.csv @@ -1,2 +1,2 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -MN692145,9689,0.1661041079701131,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.1304660973351168,1.1271545051088863,1.0,789,8795,3 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 diff --git a/tests/expected-results-single-csv/intact.fasta b/tests/expected-results-single-csv/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-single-csv/intact.fasta +++ b/tests/expected-results-single-csv/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-single-csv/nonintact.fasta b/tests/expected-results-single-csv/nonintact.fasta index 1f7afc5..e69de29 100644 --- a/tests/expected-results-single-csv/nonintact.fasta +++ b/tests/expected-results-single-csv/nonintact.fasta @@ -1,163 +0,0 @@ ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-single-csv/orfs.csv b/tests/expected-results-single-csv/orfs.csv index e41779e..5c8fb54 100644 --- a/tests/expected-results-single-csv/orfs.csv +++ b/tests/expected-results-single-csv/orfs.csv @@ -2,11 +2,11 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,amin MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5843,forward,0.587876570313453,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5830,6046,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5969,6047,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,env,6212,8783,6224,8795,forward,0.47520309038232134,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,vpu,6253,6298,6259,6310,forward,0.3649167733674775,MEMGHHAPWDVDDL,MEMGHHAPWDVDDL*,ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,tat_exon2,8364,8460,8376,8469,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8377,8653,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8796,9417,forward,0.4049958673891082,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA diff --git a/tests/expected-results-single/blast.csv b/tests/expected-results-single/blast.csv index 6830cf2..cd13240 100644 --- a/tests/expected-results-single/blast.csv +++ b/tests/expected-results-single/blast.csv @@ -1,4 +1,4 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 diff --git a/tests/expected-results-single/errors.json b/tests/expected-results-single/errors.json index 292cbf8..abf6ec8 100644 --- a/tests/expected-results-single/errors.json +++ b/tests/expected-results-single/errors.json @@ -1,14 +1,3 @@ { - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MN692145", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" - } - ] + "MN692145": [] } \ No newline at end of file diff --git a/tests/expected-results-single/holistic.json b/tests/expected-results-single/holistic.json index 060aa5a..9a1c5bf 100644 --- a/tests/expected-results-single/holistic.json +++ b/tests/expected-results-single/holistic.json @@ -1,14 +1,14 @@ { "MN692145": { "qlen": 9689, - "hypermutation_probablility": 0.1661041079701131, + "hypermutation_probablility": 0.1672411051048176, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9689, - "blast_sseq_coverage": 1.1304660973351168, + "blast_sseq_coverage": 1.130479522535501, "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-single/intact.fasta b/tests/expected-results-single/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-single/intact.fasta +++ b/tests/expected-results-single/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-single/nonintact.fasta b/tests/expected-results-single/nonintact.fasta index 1f7afc5..e69de29 100644 --- a/tests/expected-results-single/nonintact.fasta +++ b/tests/expected-results-single/nonintact.fasta @@ -1,163 +0,0 @@ ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-single/orfs.json b/tests/expected-results-single/orfs.json index 3da162b..3c10e8a 100644 --- a/tests/expected-results-single/orfs.json +++ b/tests/expected-results-single/orfs.json @@ -41,9 +41,9 @@ "start": 5547, "end": 5838, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.587876570313453, + "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG" @@ -52,8 +52,8 @@ "name": "tat_exon1", "start": 5818, "end": 6037, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -64,44 +64,44 @@ "name": "rev_exon1", "start": 5957, "end": 6038, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6049, + "end": 6298, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.520618556701031, + "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", + "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", + "nucleotides": "ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6212, "end": 8783, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.47520309038232134, + "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6253, - "end": 6298, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.3649167733674775, - "protein": "MEMGHHAPWDVDDL", - "aminoacids": "MEMGHHAPWDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8364, "end": 8460, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -112,8 +112,8 @@ "name": "rev_exon2", "start": 8365, "end": 8641, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -124,10 +124,10 @@ "name": "nef", "start": 8784, "end": 9387, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4049958673891082, + "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA" diff --git a/tests/expected-results-small-csv/blast.csv b/tests/expected-results-small-csv/blast.csv index 530b4f1..026de93 100644 --- a/tests/expected-results-small-csv/blast.csv +++ b/tests/expected-results-small-csv/blast.csv @@ -1,18 +1,18 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,9386,9635,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,180,1,180,9540,9719,2.04e-69,259,100.000,180,plus,180 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,9497,1,9493,151,9632,0.0,13151,98.473,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG229-T41AG5AG81CA45GA54CG3CA3AGGA18TC32TC11AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA85AG143AG14GA38TC52AG146GA285GA25AG11TC47GA58AG11TG181GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,484,1,484,9236,9719,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,634,1,634,9086,9719,0.0,813,94.795,601,plus,14TCGAGC5GA1AG56GA21GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,9488,9579,2.15e-30,131,98.913,91,plus,18GC73 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,8446,666,9069,1323,9673,0.0,9611,90.161,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC2-T17AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG9TC4TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC46GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC13GA3AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,9385,9634,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,180,1,180,9539,9718,2.04e-69,259,100.000,180,plus,180 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,9496,1,9493,151,9631,0.0,13155,98.484,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG270AG5AG81CA45GA54CG3CA3AGGA18TC44AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA24TCAC59AG143AG14GA38TC52AG146GA311AG11TC47GA58AG11TG181GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,484,1,484,9235,9718,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,634,1,634,9085,9718,0.0,816,94.953,602,plus,14TCGAGC5GA1AG78GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,9487,9578,2.15e-30,131,98.913,91,plus,18GC73 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,8445,666,9069,1323,9672,0.0,9616,90.172,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC19AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG14TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC16TCAC28GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC17AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 diff --git a/tests/expected-results-small-csv/errors.csv b/tests/expected-results-small-csv/errors.csv index 6f92714..39f058b 100644 --- a/tests/expected-results-small-csv/errors.csv +++ b/tests/expected-results-small-csv/errors.csv @@ -1,34 +1,32 @@ sequence_name,error,message KX505501.1,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 2721" -KX505501.1,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6323 +KX505501.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6322 KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" -KX505501.1,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 195 positions. -KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893 -KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5969-6047 contains an internal stop codon at 6005 -KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 40 positions. -KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 96" -KX505501.1,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1116" +KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" +KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 +KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004 +KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions. +KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions. +KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" +KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" KX505501.1,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. KX505501.1,LongDeletion,Query sequence contains a long deletion. KX505501.1,Scramble,Sequence is plus-scrambled. -MN691959,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN691959,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" +MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123 +MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 MN692074,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 981" -MN692074,InternalStopInOrf,ORF env at 6224-8795 contains an internal stop codon at 6551 +MN692074,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" -MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5843 can have maximum insertions 90, got 261" -MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893 -MN692074,InsertionInOrf,"Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 108" -MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 76 positions. -MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 204" -MN692074,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1131" +MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" +MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 +MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" +MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions. +MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" +MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" MN692074,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. MN692074,LongDeletion,Query sequence contains a long deletion. -MN692145,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions. -MN692145,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" MN090335,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 -MN090335,FrameshiftInOrf,Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions. -MN090335,InsertionInOrf,"Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 282" +MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 MN090335,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 42 deletions with max tolerance of 10 deletions. MN090335,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, AT." MN090335,Scramble,Sequence is minus-scrambled. diff --git a/tests/expected-results-small-csv/holistic.csv b/tests/expected-results-small-csv/holistic.csv index 0dd3a51..352edd3 100644 --- a/tests/expected-results-small-csv/holistic.csv +++ b/tests/expected-results-small-csv/holistic.csv @@ -1,6 +1,6 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498199403230785,1.2158237356034052,0.17661753684736448,789,8795,4 -MN691959,9493,0.19593905853945925,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0816956477003807,1.1086063415148004,1.0,789,8795,3 -MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5041670953801831,1.1728099569171853,0.41144141893579816,789,8795,4 -MN692145,9689,0.1661041079701131,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.1304660973351168,1.1271545051088863,1.0,789,8795,3 -MN090335,9069,0.1754017863888554,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842576396748637,1.0603153600176425,1.0003747189607795,789,8795,3 +KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17663960024984385,789,8794,4 +MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8794,3 +MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.4114928169893816,789,8794,4 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 +MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.0003747657713928,789,8794,3 diff --git a/tests/expected-results-small-csv/intact.fasta b/tests/expected-results-small-csv/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-small-csv/intact.fasta +++ b/tests/expected-results-small-csv/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-small-csv/nonintact.fasta b/tests/expected-results-small-csv/nonintact.fasta index 94eb85d..1baa046 100644 --- a/tests/expected-results-small-csv/nonintact.fasta +++ b/tests/expected-results-small-csv/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA diff --git a/tests/expected-results-small-csv/orfs.csv b/tests/expected-results-small-csv/orfs.csv index 4880772..a5fce96 100644 --- a/tests/expected-results-small-csv/orfs.csv +++ b/tests/expected-results-small-csv/orfs.csv @@ -1,56 +1,56 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides -KX505501.1,env,0,1824,6224,8795,forward,0.7626080297560442,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,env,0,1824,6223,8794,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG KX505501.1,vif,0,1824,5040,5619,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,nef,0,1824,8796,9417,forward,0.7645782478980201,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,tat_exon1,1,1750,5830,6046,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,nef,0,1824,8795,9416,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,tat_exon1,1,1750,5829,6045,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT KX505501.1,gag,336,1824,789,2292,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon1,1306,1750,5969,6047,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,vpr,1599,1824,5558,5843,forward,0.7638478800047243,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon1,1306,1750,5968,6046,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,vpr,1599,1824,5558,5849,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1599,1824,6060,6309,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG KX505501.1,pol,1627,1927,2084,5096,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,tat_exon2,1746,1824,8376,8469,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon2,1747,1927,8377,8653,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,vpu,1748,1778,6259,6310,forward,0.7688723205964585,MHPEYYKDC,MHPEYYKDC*,ATGCATCCGGAGTACTACAAGGACTGCTGA +KX505501.1,tat_exon2,1746,1824,8375,8471,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon2,1747,1927,8376,8652,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA MN691959,gag,639,2142,789,2292,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN691959,pol,1934,4946,2084,5096,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN691959,vif,4890,5469,5040,5619,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG -MN691959,vpr,5408,5699,5558,5843,forward,0.5391891891891883,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN691959,tat_exon1,5679,5898,5830,6046,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN691959,rev_exon1,5818,5899,5969,6047,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN691959,env,6070,8656,6224,8795,forward,0.13638128518734216,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA -MN691959,vpu,6105,6156,6259,6310,forward,0.2321981424148607,MGVEMGHHAPWDIDDL,MGVEMGHHAPWDIDDL*,ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG -MN691959,tat_exon2,8237,8333,8376,8469,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA -MN691959,rev_exon2,8238,8514,8377,8653,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG -MN691959,nef,8657,9278,8796,9417,forward,0.08588605782994552,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA -MN692074,nef,0,4059,8796,9417,forward,0.763072203234748,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG -MN692074,env,2,4115,6224,8795,forward,0.7604257801108195,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpu,2,2084,6259,6310,forward,0.7659115426105717,MGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAA +MN691959,vpr,5408,5699,5558,5849,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN691959,tat_exon1,5679,5898,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN691959,rev_exon1,5818,5899,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN691959,vpu,5910,6156,6060,6309,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8656,6223,8794,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA +MN691959,tat_exon2,8237,8333,8375,8471,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8514,8376,8652,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9278,8795,9416,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,nef,0,4059,8795,9416,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG +MN692074,env,2,4115,6223,8794,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA MN692074,gag,789,2292,789,2292,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN692074,pol,2084,4115,2084,5096,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA MN692074,vif,3617,4115,5040,5619,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpr,3617,4115,5558,5843,forward,0.7635778016363703,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,tat_exon1,3823,4084,5830,6046,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,rev_exon1,3823,4084,5969,6047,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,tat_exon2,4080,4164,8376,8469,forward,0.7699443413729128,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA -MN692074,rev_exon2,4081,4153,8377,8653,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG +MN692074,vpr,3617,4115,5558,5849,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpu,3617,4115,6060,6309,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4084,5829,6045,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4084,5968,6046,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,tat_exon2,4080,4164,8375,8471,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4081,4153,8376,8652,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5843,forward,0.587876570313453,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5830,6046,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5969,6047,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,env,6212,8783,6224,8795,forward,0.47520309038232134,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,vpu,6253,6298,6259,6310,forward,0.3649167733674775,MEMGHHAPWDVDDL,MEMGHHAPWDVDDL*,ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,tat_exon2,8364,8460,8376,8469,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8377,8653,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8796,9417,forward,0.4049958673891082,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA MN090335,gag,315,1665,789,2292,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA MN090335,pol,1427,4469,2084,5096,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG MN090335,vif,4413,4992,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090335,vpr,4931,5222,5558,5843,forward,0.6083541998634192,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG -MN090335,tat_exon1,5202,5421,5830,6046,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA -MN090335,rev_exon1,5341,5422,5969,6047,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG -MN090335,env,5596,8158,6224,8795,forward,0.5139610675592354,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA -MN090335,vpu,5643,5682,6259,6310,forward,0.5690703735881842,MGHDAPWDVDDL,MGHDAPWDVDDL*,ATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG -MN090335,tat_exon2,7739,7835,8376,8469,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA -MN090335,rev_exon2,7740,8016,8377,8653,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG -MN090335,nef,8159,8813,8796,9417,forward,0.49485619884358334,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MN090335,vpr,4931,5222,5558,5849,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG +MN090335,tat_exon1,5202,5421,5829,6045,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA +MN090335,rev_exon1,5341,5422,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG +MN090335,vpu,5433,5682,6060,6309,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8158,6223,8794,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7835,8375,8471,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8016,8376,8652,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8813,8795,9416,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA diff --git a/tests/expected-results-small/blast.csv b/tests/expected-results-small/blast.csv index 530b4f1..026de93 100644 --- a/tests/expected-results-small/blast.csv +++ b/tests/expected-results-small/blast.csv @@ -1,18 +1,18 @@ qseqid,sseqid,sgi,qlen,slen,length,qstart,qend,sstart,send,evalue,bitscore,pident,nident,sstrand,btop -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,251,1747,1997,9386,9635,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 -KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9719,180,1,180,9540,9719,2.04e-69,259,100.000,180,plus,180 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,9497,1,9493,151,9632,0.0,13151,98.473,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG229-T41AG5AG81CA45GA54CG3CA3AGGA18TC32TC11AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA85AG143AG14GA38TC52AG146GA285GA25AG11TC47GA58AG11TG181GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 -MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9719,484,1,484,9236,9719,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,634,1,634,9086,9719,0.0,813,94.795,601,plus,14TCGAGC5GA1AG56GA21GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 -MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9719,92,4087,4178,9488,9579,2.15e-30,131,98.913,91,plus,18GC73 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,9753,1,9689,1,9719,0.0,11990,93.264,9096,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC2-T6GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC32TC1AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA31CA36GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,1,616,9086,9719,0.0,760,92.283,586,plus,24AG12TC8AG34GA56TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9719,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,8446,666,9069,1323,9673,0.0,9611,90.161,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC2-T17AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG9TC4TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC46GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC13GA3AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 -MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9719,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,1751,1,1746,455,2202,0.0,2186,93.946,1645,plus,254-A7GA1AG35GA4T-T-68GA3AC17CT10AG5TG4GA7CT25AG33CT46GAAT1TC3AC21AGGA2TA2GA9AG5GATC12AG7AGAG5TGGA1GA17CT14AG16TG2GA4CA11AG1CA7-A-C-A5ACGATC4GA12CA9GA10T-3-C15TC8CA1GA5AT27AG4GA2AG20AG44CT17TC47TC27TG99CG36GA23AG2GA30GATC36TC32CT11AG5CTAT7AG35GA20AG17AG8AG2CT26CT8GA9AG7AG30AG1GA14ACGA12AG24AG1CT9CT25TC24AG25GA9TC11CT24GT7AG12CT13GA8CT7AG26CA14TC5AT7CA5 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,301,550,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,251,1747,1997,9385,9634,2.53e-85,312,93.625,235,plus,2AC15AT4GA10CTTC6TGTCCT30T-AG1GA42GC21CT9GTAG46GA49 +KX505501.1,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,1997,9718,180,1,180,9539,9718,2.04e-69,259,100.000,180,plus,180 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,9496,1,9493,151,9631,0.0,13155,98.484,9352,plus,13TG3GT7GA5TC56TG51GA129GC68TC84AG159AC359GC71CT3AG41GA79AG256YCWAYC2WA103AG146WA2AG38GA142TC72GT141TC52AG298TC8AG101AG125AG539AG65GA7GA4TC55GA2AG131GA13CT66TC25GA9AG38AG38CT11TC53TC50GA11CT1AG12GA6CA8AG263AG349AT21AG12AG313GA254ACAC26TC108GA105TC119AG270AG5AG81CA45GA54CG3CA3AGGA18TC44AC2-T-A-G49AG41GA69GA1GA51AG114GA215GAGA5CA3T-A-A-T-A-C-C-A-A-T-A-G-T-A-G-22GAAG6GA54AGAG24CT18GA30CA231TG16CT9AG33CAAC48TA99GACA225AC21TA17GA34CT61AG8GA207GC122AG68CT81AC3TC290AC4GA24TCAC59AG143AG14GA38TC52AG146GA311AG11TC47GA58AG11TG181GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,547,8947,9493,1,547,0.0,752,97.989,536,plus,23AC57GA37TC43TG3GT7GA5TC56TG51GA129GC68TC57 +MN691959,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9493,9718,484,1,484,9235,9718,0.0,676,98.760,478,plus,17GA58AG11TG181GC68TC84AG59 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,4082,1,4082,1,4082,0.0,5487,97.036,3961,plus,14TCGAGC5GAACAG56GA21GA4CT5TA23TA18TG9GT7GA5TCGACA11AC16AG1AG11GA5GT10AG10AGTA5AG56AT6TC7TA7ATTG77GC79GA48TC103TC12AG148TC1CG12CTACAG44GA154AG27AG7GA25GC3GA31GA27AC3AG2GACT125AG138TG4CT41GA92CT18AC22GA8TC59TC107GA17CG6TC31GA17AG14GT46AG20AG2GA2AT35TC29GA88CT22CT49TC5AT16GC41GA10AG33GA68AG195TC8AG101AG181GA33GT27AG4AC2TC5AG20CT4GT96TC29AC29AG14TC22TC12AG20AG6TC34CT110AG65GA21AG2GA11AG13GA17GA2AG26AG53TC61AG105AG11AG12GA52CT128CT21TA31AG12CT86 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,634,1,634,9085,9718,0.0,816,94.953,602,plus,14TCGAGC5GA1AG78GA3AGCT5TA23TA18TG5GT3GA14GACA11AC16AG1AG17GT10AG10AGTA5AG28AG27AT6TC7TA7ATTG77GC79GA48TC84 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,403,494,2.15e-30,131,98.913,91,plus,18GC73 +MN692074,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,4178,9718,92,4087,4178,9487,9578,2.15e-30,131,98.913,91,plus,18GC73 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,9752,1,9689,1,9718,0.0,12000,93.294,9098,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA153TC12AG13AC37AG40T-T-T-T-63AG9AG6GA36CA27AG3AG11TC27AT7AC32TC25AG51TGGA19AT5TC23GA6GA8AC1AG21AC7CT33CA1TC5CG11CT42AG28AG62TC41AG107CT65CT41GA8TC17TC17AG3TC10TC17CT14TC8CT48TG1AG20CT19GCAG38GA17AG8CT67GA6GA32GA5TC1TC81AG23AG12CT7GA8AG5CT11GA37TC5AT16TC14TC3CT2GA12T-C-C-7GA10AG106AG47TC24TCCT30GT56AG8TC11CT8TC8AG84AGCT15AG65TC17CT41AG11TC20GA11AC74GA2TC114TA127AGTC26TC109AC23AG11TG26TCGC7CT7AGAG14TC5GA3GA64GA6TC91GA48GA56GA4TA37GAGATC1AG11AG65CT65TC18TG4TC2AG33GA1CT11GA9TA44CT19AG66AC34AG11CA14CTTC58TC3AG7TC2AG38AT14CT47GA7GA84GA95AG14CT5CT41AT11TC8TCAG2AG4AG4AG21GA11GA5CA80CT17AG26TC147GA28TC26GA8CT34TC3AG119AG32AC27TCGA64TC40GA24CTAG1CA14GA20TC11AC13GATG3AT10TC8TC5TG41GA9TC24GA2GT6CA15GA1AG2GA45CA10TC1TCCA1GT62GT32CA18AG43CT2TC8GA10AG16AG3TC3CA9AG15AG37CT8GA12TACA30TC5CT8GA57TCCA3AGGA18TC34AC1CATC2TA3AC4TGCT13AT17CA19TC6TA40TC15AC3GT36GA2TACAATGAGTAC2AC3A-1CGATAGCG2CAATCGTGTGAG-G48GA3GACA2TA38AG46GA66GAAGGT5AT21TC7GA4CGCAAC29TC35GA2GA14CT1CG6TG12GAGAAGCA1GT2GT1GC-T-A-A8AG2AG2TG1AGCGAGGA3GTTG3-A-T-G11AG2GA21TACG1TA6AT1GA2AG6GT3TG13CT16GA2GA9GA4AG3A-G-A-3A-T-G-G-T-A-A-T-T-A-T-T-1TC7GA5TC9TC29AG5AC22TA15GT1AT12GA6GA4AGCAACAG41GA50TC34CT43CAAC14CA13GAGATC10TG2GA1GA1GAGA1TC1AGCT2GC-C-A-G-A-G-A10AGGA6TGAT1GA2GAGT2CG2TA2CT4GA4AG3AC12TA5AG2AG12CT1GATC7GA2TA1GA3TC1GACGAC8TA2GA6AG1GA-A-A-T13AT5CATG3CT28AG39AT5AC20ATAT1G-C-2CT1CG-T2AT1-G2TG2AC2GATAAGCGTG1GCGA3GA1TC5GA4AG1-G-A-C-A-C-A45GA34AT20CA12TC25GT1CGTC3GA1-T3CTA-A-C-A-C-C-A-10TC23AG40GA15GA66CT44AG1GC2GA3GA2TC40AG20AG17AG3TC23GA20GA8CG35TA36AC38GA3AG6GA1GTAC3TC18AC9GA1TC18TC2AT1TC6AGCA9GA1TA3AG6CA8AC7GA8GA13AG16GAGA9CT11CT6AT4TC20AG59CT22GA1TC5GA30TC37GACT2CG9AC4TC3AG13TA6AG50ATAG42TC9CT1TG5GA17CGAT72AG11TG5AG3TC2TG9CT1TG3TC2CA4CG18TG6GACT16GT21TG2GA12AC40GA12TC10TC6GA21TC9AG3AC8AC22AG129AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC20CT-T56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,1,616,9085,9718,0.0,763,92.441,587,plus,24AG12TC8AG91TA20-C-A-G-A-T-A-A-G-A-T-A-G-A-A-G-A-G-G3CA1GA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT8AT9GA34GA12AG27AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN692145,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9689,9718,635,9074,9689,1,634,0.0,752,91.811,583,plus,23ACAG12TC8AG34GA25GA30TA20-C-A-G-A-G-A-A-G-T-T-A-G-A-A-G-A-A-G3CATCGA1CAAG7TCGAAC3AC3CT1GA7CTAG8GT2GA5AT9GA34GA40AT23TG31G-21GA1AT22GC18-T2CT56GA134 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,8445,666,9069,1323,9672,0.0,9616,90.172,7615,plus,18GA5TC17TG5CT8TC18GATC31TG1AG108CA25GA20TC6CT38TC9AGGA5GA45TC17AT7AG35GA5AG2TC11AG17AG8AG38GA2GA14AG31CT4GAGA1AT4CT1AC4CA35CACT6AG28TC5AG44GA18GA5CT29AG11TCCT19C-T-2C-C-T-C-A-G-A-G-C-C-G-A-C-C-A-G-A-A-A-3CT28C-C-A-G-C-C-C-C-T-19TC5AT2-A-G-A11TC14AC1AG2GA8GA5T-C-C-4CT13AG20AC38TC34GA2CA2AGGAAG11AG51AG5AT3GA3CT9TCAT1CT5CT17GA51CA11CT13CT11AG32CT8GA17AG41AG59GA20TCGA1CT53AC9AG10TA11TC6CT19CA45AG13AG59TC14AG44GA3CT1GA14GAACCA69AG12GA7AG5GA9AT11TC19GA2CT11CT17GT15AG25AG11GA2AC2TC32AG5AG20TCGC13GA1AG12GA8GA12TC11GA43GA14TA2GA10CTAG12GT4GA15CA13AGGC4TC2GA47GA13CT12TC14GA27TA10TC16GA14GA1TC1AG11AG26TG20CT17CT2CT35AG12AG37TC5TG1AC5CT22GA16GA9AC3AC18AG5AG8CA3CT7CT14GACT28GA11GA21AC21GA12AG26CT11GA5CA26GA9CT46AT2AG8AT2CA27AG22AG6AG55TC8GA20TA8GA22AG4AG49GT11GA8AG11CT3AC8CT34AT9CA11AG2AGAC3AG2GT1AG39TA17GA29TA110AG41AC5GA34CA31GA28TC38CT35AG91TC11AG5AGAG6CT1AGAGAGAG4GTCT9CT2TC2CT4CG1AC28TC16AC42GA17CT23AG4GA27CATC10TA9GC2CT4TC5TC11AC14TG3AT10TC1GT67AG5GT13GA26AT1AC53AG6TC28AG10GAAT17CT5AGCACTAT5AC2AT1AG1CT4AG3TC29AG35AC10TC19AGCA15AG2GATC2TGGA2AG2AG26AC38GAGA3CG46GT5TC3CAAC43AC8TG3CA3AGGA18TC1CT5CT14AG14TC2TA2GCACGA3TG26GACT22AT8GAGT39TC1AGAGAT5AG5AC3GT30CT5G-G-A-T-C-A-G-G-A-4TA1GA11-G-G-A-G-A-T-G-G-G6AG9GC33GA1GA5TA37GAAG2TA4ACTC11CT32AG44TC8TA7AT4AGAT21TC12AG7GA2CA22AG29CT6GA16CG6TG11AG1GAAG9G-T-A-G-G-2ATTA1AC2CT1AGATTACG1CAAG1TG1AG1-G1CA1AG2A-C-3AGCG2GAGA1AG4AG2GA1CA20CG4GAAGGC7AG3AG4GAAG6CT5CT17GA1CA2GA10GAGT4AC3AC2TC4CAAG4TC2AG3CT2TC33AT7AG21AG1TC2AG11AG8GA5GTGA2GA3TC23ACGA35AG8GA11AG11TC2CT9AG5AG5CA9ATAC8AG7GC5ACTC14AG2TC1GC4AG3TA39TA2ACAC2GA1-C-C2-A-G-A-G-G-A-C11AT2TGAT1GA3CT3GACA1G-A-T-7GA4AG20CT3G-3-G2GA1TA6GA9GACAAC1AG4TC1GAAGAC8GA3AC10ATGA19TG5AC12ACTCGA7AT42CTAT6GA19ATGT1GATA2AG1-A-C-T-T3-G-T3-G-A2-G-G-T2TA1-T3-A-C-T-G-A-A4CG1AG1AC1ACTA5AC5GA25GT7GA28TC8GAACTA6GA2CT17AG2AGAC21C-A-A-3AGTC1G-T-3G-1GT3AT1GC4CT15GA3AG6AG30CT17GA27CA32AG1AG3GAC-G-T-8AT7CT38GC3CA16AG29AG12CT29AC28AG15GA5TG17CA56AG14AG10CT9TCATCG2TAACCACG2CT3GA2AC3TC10CG17CA1AC9GA1GCATAT4TC2ATAC4CA4GA10TA3AG2GA12AC1GA8AG3CT5CA9AG17GATC8AT18AT25AG10AG4AG11TC31CT11AG2GT7TA21AC16TCAC28GA7GAGTATAC9CATC4TC3AGCG4CT11CT31AG24GACATC5CT4CG2GC9AG12GAAGTC6GA2CT7GA6GA10TG37AG3TC3TC2CA14AG17GA4GT4AG2AGTC1GT1CT6TA3TG15GA11AC2AG6GACT5AT4AG21GA2TA2AG2GACT28G-A-A-2A-A-T-T-G-A-T-C-C-A-A-G-G-C-C-T-G-C-T-G-C-A-A-G-G-A-G-G-G-A-2AG17CA1GA4AG18TC8TC26TG2AG4TC41AG2AG2CT10GC33AG6TG1GA48TCGAGC5GA11AT9TC5GA1TC14AC17AG14AG13TA23TA18TG5CTCA1AGGA4GAAG8GA12AC1TA5CT8AG19AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TCAGGTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,627,46,669,1326,700,0.0,792,94.258,591,minus,33TC20TC68TG1GT16AT7AG3GATC3GACTCTTG4TG15CT11CT31CT9CA19CTAC6TC7TC14GT63TC3AG3CT3TC8CT43TC30CT37CT7TG18CT53AT1-T-T-T55 +MN090335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,0,9069,9718,588,8482,9069,1,588,0.0,673,89.966,529,plus,14TCGAGC5GAAC10AT9TC5GA1TC14AC13GA3AG14AG6GA6TA23TA18TG5CGCA1AGGT4GAAG1GA5TCGA12AC1TA5CT8AG13GA5AT3TC1AG3GA11AGTA5AG10AC4GA2GA8TC1GTAG8AG1ATAG13AT3AGGA10CTTC5ATTG37TC16CT22GC21CT24GA120 diff --git a/tests/expected-results-small/errors.json b/tests/expected-results-small/errors.json index d1facf1..e0159fe 100644 --- a/tests/expected-results-small/errors.json +++ b/tests/expected-results-small/errors.json @@ -8,7 +8,7 @@ { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6323" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6322" }, { "sequence_name": "KX505501.1", @@ -17,33 +17,38 @@ }, { "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 195 positions." + "error": "DeletionInOrf", + "message": "Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon1 at 5969-6047 contains an internal stop codon at 6005" + "message": "Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004" + }, + { + "sequence_name": "KX505501.1", + "error": "FrameshiftInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions." }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 40 positions." + "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions." }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 96" + "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1116" + "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" }, { "sequence_name": "KX505501.1", @@ -64,13 +69,13 @@ "MN691959": [ { "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123" }, { "sequence_name": "MN691959", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 249" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" } ], "MN692074": [ @@ -82,7 +87,7 @@ { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "ORF env at 6224-8795 contains an internal stop codon at 6551" + "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" }, { "sequence_name": "MN692074", @@ -92,32 +97,32 @@ { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpr at 5558-5843 can have maximum insertions 90, got 261" + "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5830-6046 contains an internal stop codon at 5893" + "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6259-6310 can have maximum insertions 90, got 108" + "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8376-8469 contains out of frame indels that impact 76 positions." + "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions." }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8377-8653 can have maximum deletions 30, got 204" + "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 1131" + "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" }, { "sequence_name": "MN692074", @@ -130,18 +135,7 @@ "message": "Query sequence contains a long deletion." } ], - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 75 positions." - }, - { - "sequence_name": "MN692145", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 231" - } - ], + "MN692145": [], "MN090335": [ { "sequence_name": "MN090335", @@ -150,13 +144,8 @@ }, { "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF vpr at 5558-5843 contains out of frame indels that impact 76 positions." - }, - { - "sequence_name": "MN090335", - "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8796-9417 can have maximum insertions 90, got 282" + "error": "InternalStopInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" }, { "sequence_name": "MN090335", diff --git a/tests/expected-results-small/holistic.json b/tests/expected-results-small/holistic.json index f80f6bf..b652f68 100644 --- a/tests/expected-results-small/holistic.json +++ b/tests/expected-results-small/holistic.json @@ -4,23 +4,23 @@ "hypermutation_probablility": 0.7087072014754221, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 1997, - "blast_sseq_coverage": 0.2498199403230785, + "blast_sseq_coverage": 0.2498456472525211, "blast_qseq_coverage": 1.2158237356034052, - "blast_sseq_orfs_coverage": 0.17661753684736448, + "blast_sseq_orfs_coverage": 0.17663960024984385, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MN691959": { "qlen": 9493, - "hypermutation_probablility": 0.19593905853945925, + "hypermutation_probablility": 0.19667690182893238, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9493, - "blast_sseq_coverage": 1.0816956477003807, + "blast_sseq_coverage": 1.0817040543321672, "blast_qseq_coverage": 1.1086063415148004, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MN692074": { @@ -28,35 +28,35 @@ "hypermutation_probablility": 0.36378645339477633, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 4178, - "blast_sseq_coverage": 0.5041670953801831, + "blast_sseq_coverage": 0.5042189750977567, "blast_qseq_coverage": 1.1728099569171853, - "blast_sseq_orfs_coverage": 0.41144141893579816, + "blast_sseq_orfs_coverage": 0.4114928169893816, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 4 }, "MN692145": { "qlen": 9689, - "hypermutation_probablility": 0.1661041079701131, + "hypermutation_probablility": 0.1672411051048176, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9689, - "blast_sseq_coverage": 1.1304660973351168, + "blast_sseq_coverage": 1.130479522535501, "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 }, "MN090335": { "qlen": 9069, - "hypermutation_probablility": 0.1754017863888554, + "hypermutation_probablility": 0.1771850809736527, "inferred_subtype": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455", "blast_matched_qlen": 9069, - "blast_sseq_coverage": 0.9842576396748637, + "blast_sseq_coverage": 0.9842560197571517, "blast_qseq_coverage": 1.0603153600176425, - "blast_sseq_orfs_coverage": 1.0003747189607795, + "blast_sseq_orfs_coverage": 1.0003747657713928, "orfs_start": 789, - "orfs_end": 8795, + "orfs_end": 8794, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-small/intact.fasta b/tests/expected-results-small/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-small/intact.fasta +++ b/tests/expected-results-small/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-small/nonintact.fasta b/tests/expected-results-small/nonintact.fasta index 94eb85d..1baa046 100644 --- a/tests/expected-results-small/nonintact.fasta +++ b/tests/expected-results-small/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA diff --git a/tests/expected-results-small/orfs.json b/tests/expected-results-small/orfs.json index acad930..0e30b50 100644 --- a/tests/expected-results-small/orfs.json +++ b/tests/expected-results-small/orfs.json @@ -4,10 +4,10 @@ "name": "env", "start": 0, "end": 1824, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.7626080297560442, + "distance": 0.7623480451210163, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -28,10 +28,10 @@ "name": "nef", "start": 0, "end": 1824, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.7645782478980201, + "distance": 0.764345579086969, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -40,8 +40,8 @@ "name": "tat_exon1", "start": 1, "end": 1750, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7680130480667754, "protein": "MRKLQNGIDCIQCMQGLLHQAR", @@ -64,8 +64,8 @@ "name": "rev_exon1", "start": 1306, "end": 1750, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.758082497212932, "protein": "MRTQIVKLF", @@ -77,9 +77,21 @@ "start": 1599, "end": 1824, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, + "orientation": "forward", + "distance": 0.763687959047407, + "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", + "aminoacids": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", + "nucleotides": "ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" + }, + { + "name": "vpu", + "start": 1599, + "end": 1824, + "subtype_start": 6060, + "subtype_end": 6309, "orientation": "forward", - "distance": 0.7638478800047243, + "distance": 0.7672672672672673, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", "nucleotides": "ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG" @@ -100,8 +112,8 @@ "name": "tat_exon2", "start": 1746, "end": 1824, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.7616257781032589, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", @@ -112,25 +124,13 @@ "name": "rev_exon2", "start": 1747, "end": 1927, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.7620186257236345, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", "nucleotides": "GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA" - }, - { - "name": "vpu", - "start": 1748, - "end": 1778, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7688723205964585, - "protein": "MHPEYYKDC", - "aminoacids": "MHPEYYKDC*", - "nucleotides": "ATGCATCCGGAGTACTACAAGGACTGCTGA" } ], "MN691959": [ @@ -175,9 +175,9 @@ "start": 5408, "end": 5699, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.5391891891891883, + "distance": 0.09157509157509158, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG" @@ -186,8 +186,8 @@ "name": "tat_exon1", "start": 5679, "end": 5898, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", @@ -198,44 +198,44 @@ "name": "rev_exon1", "start": 5818, "end": 5899, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5910, + "end": 6156, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.7333193453629878, + "protein": "MQPIQIAIVALVVAIIIAIVV", + "aminoacids": "MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*", + "nucleotides": "ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG" + }, { "name": "env", "start": 6070, "end": 8656, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.13638128518734216, + "distance": 0.1405525502318391, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*", "nucleotides": "ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA" }, - { - "name": "vpu", - "start": 6105, - "end": 6156, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.2321981424148607, - "protein": "MGVEMGHHAPWDIDDL", - "aminoacids": "MGVEMGHHAPWDIDDL*", - "nucleotides": "ATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8237, "end": 8333, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6672629695885509, "protein": "RPTSQTRGDPTGPKE", @@ -246,8 +246,8 @@ "name": "rev_exon2", "start": 8238, "end": 8514, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.210025203024363, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", @@ -258,10 +258,10 @@ "name": "nef", "start": 8657, "end": 9278, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.08588605782994552, + "distance": 0.06582796957284964, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA" @@ -272,10 +272,10 @@ "name": "nef", "start": 0, "end": 4059, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.763072203234748, + "distance": 0.7628009106462086, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*", "nucleotides": "TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG" @@ -284,26 +284,14 @@ "name": "env", "start": 2, "end": 4115, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.7604257801108195, + "distance": 0.76033143808071, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", "nucleotides": "GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" }, - { - "name": "vpu", - "start": 2, - "end": 2084, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.7659115426105717, - "protein": "MGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ", - "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*", - "nucleotides": "GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAA" - }, { "name": "gag", "start": 789, @@ -345,9 +333,21 @@ "start": 3617, "end": 4115, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.7635778016363703, + "distance": 0.7629151983204618, + "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", + "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", + "nucleotides": "ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" + }, + { + "name": "vpu", + "start": 3617, + "end": 4115, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.7634058115037564, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", "nucleotides": "ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA" @@ -356,8 +356,8 @@ "name": "tat_exon1", "start": 3823, "end": 4084, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7659115426105717, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -368,8 +368,8 @@ "name": "rev_exon1", "start": 3823, "end": 4084, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.7610789980732178, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -380,10 +380,10 @@ "name": "tat_exon2", "start": 4080, "end": 4164, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", - "distance": 0.7699443413729128, + "distance": 0.769292994661058, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", "nucleotides": "ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA" @@ -392,8 +392,8 @@ "name": "rev_exon2", "start": 4081, "end": 4153, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.7667894365645325, "protein": "YPVASPQMLHISSCFLPVLGLSG", @@ -443,9 +443,9 @@ "start": 5547, "end": 5838, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.587876570313453, + "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG" @@ -454,8 +454,8 @@ "name": "tat_exon1", "start": 5818, "end": 6037, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -466,44 +466,44 @@ "name": "rev_exon1", "start": 5957, "end": 6038, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 6049, + "end": 6298, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.520618556701031, + "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", + "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", + "nucleotides": "ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 6212, "end": 8783, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.47520309038232134, + "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", "nucleotides": "ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA" }, - { - "name": "vpu", - "start": 6253, - "end": 6298, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.3649167733674775, - "protein": "MEMGHHAPWDVDDL", - "aminoacids": "MEMGHHAPWDVDDL*", - "nucleotides": "ATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 8364, "end": 8460, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -514,8 +514,8 @@ "name": "rev_exon2", "start": 8365, "end": 8641, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -526,10 +526,10 @@ "name": "nef", "start": 8784, "end": 9387, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.4049958673891082, + "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*", "nucleotides": "ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA" @@ -577,9 +577,9 @@ "start": 4931, "end": 5222, "subtype_start": 5558, - "subtype_end": 5843, + "subtype_end": 5849, "orientation": "forward", - "distance": 0.6083541998634192, + "distance": 0.3808935556928146, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*", "nucleotides": "ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG" @@ -588,8 +588,8 @@ "name": "tat_exon1", "start": 5202, "end": 5421, - "subtype_start": 5830, - "subtype_end": 6046, + "subtype_start": 5829, + "subtype_end": 6045, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", @@ -600,44 +600,44 @@ "name": "rev_exon1", "start": 5341, "end": 5422, - "subtype_start": 5969, - "subtype_end": 6047, + "subtype_start": 5968, + "subtype_end": 6046, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG" }, + { + "name": "vpu", + "start": 5433, + "end": 5682, + "subtype_start": 6060, + "subtype_end": 6309, + "orientation": "forward", + "distance": 0.5244381020335356, + "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", + "aminoacids": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*", + "nucleotides": "ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG" + }, { "name": "env", "start": 5596, "end": 8158, - "subtype_start": 6224, - "subtype_end": 8795, + "subtype_start": 6223, + "subtype_end": 8794, "orientation": "forward", - "distance": 0.5139610675592354, + "distance": 0.5152420275849952, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", "aminoacids": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*", "nucleotides": "ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA" }, - { - "name": "vpu", - "start": 5643, - "end": 5682, - "subtype_start": 6259, - "subtype_end": 6310, - "orientation": "forward", - "distance": 0.5690703735881842, - "protein": "MGHDAPWDVDDL", - "aminoacids": "MGHDAPWDVDDL*", - "nucleotides": "ATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG" - }, { "name": "tat_exon2", "start": 7739, "end": 7835, - "subtype_start": 8376, - "subtype_end": 8469, + "subtype_start": 8375, + "subtype_end": 8471, "orientation": "forward", "distance": 0.6842105263157894, "protein": "RPSSQPRGDQTGPKE", @@ -648,8 +648,8 @@ "name": "rev_exon2", "start": 7740, "end": 8016, - "subtype_start": 8377, - "subtype_end": 8653, + "subtype_start": 8376, + "subtype_end": 8652, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", @@ -660,10 +660,10 @@ "name": "nef", "start": 8159, "end": 8813, - "subtype_start": 8796, - "subtype_end": 9417, + "subtype_start": 8795, + "subtype_end": 9416, "orientation": "forward", - "distance": 0.49485619884358334, + "distance": 0.4891015417331206, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", "aminoacids": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*", "nucleotides": "ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA" diff --git a/util/subtype_alignments/all.fasta b/util/subtype_alignments/all.fasta index 7e414f3..f1ff126 100644 --- a/util/subtype_alignments/all.fasta +++ b/util/subtype_alignments/all.fasta @@ -1018,72 +1018,72 @@ CCACCTTTGCCTAGTGTTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACC AAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGA ATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATG AAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGC -TGTTTATCCATTTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGG -AGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCA -GCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTG -TTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAG -AGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGT -AACGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAAT -AGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGA -CAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGA -AATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGA -TGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGA -AGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTAC -ATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTAT -TGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATG -AGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCT -GTGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGA -GAATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAA -GAGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATA -ATGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTC -CAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTC -TAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTAC -AATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAG -CAGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAG -TACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAA -GAATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATA -TGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAG -CTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAG -GAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTA -ATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAA -ATAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACA -TGTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTT -CATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCG -AGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAAT -ATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGG -TGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAG -CAGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGT -CTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGT -TGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGAT -ACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCA -CTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACA -CGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAA -TTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAAT -GGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCA -TAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGA -ATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGG -GACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCA -TTCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCT -TCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGG -GACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGG -AACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGA -CAGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAA -GAATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGT -AGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAT -AGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACA -GCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTT -CCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGC -CACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGAT -ATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTAGCAGAACTACACA -CCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTT -GAGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTG -AGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGC -CTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACAT -CGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGG -ACTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGG -GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACT -GCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTG -TGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA +TGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGA +GAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAG +CCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGT +TTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGA +GCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTA +ATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATA +GTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGAC +AGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAA +ATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGAT +GATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAA +GGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACA +TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATT +GGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGA +GGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG +TGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAG +AATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAG +AGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAA +TGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCC +AAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCT +AAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACA +ATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGC +AGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGT +ACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAG +AATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATAT +GAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGC +TAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGG +AGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAA +TTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAA +TAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACAT +GTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTC +ATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGA +GATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATA +TAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGT +GCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGC +AGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTC +TGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTT +GCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATA +CCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCAC +TGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACAC +GACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAAT +TGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATG +GGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCAT +AATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAA +TAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGG +ACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAT +TCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTT +CAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGG +ACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGA +ACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGAC +AGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAG +AATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTA +GTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATA +GGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAG +CAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTC +CAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCC +ACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATA +TCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACAC +CAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTG +AGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGA +GCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCC +TAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATC +GAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGA +CTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG +TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTG +CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT +GACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA >Ref.B.NL.00.671_00T36.AY423387 GAGCCTGGGAGCTCTCTGGCTAGCTGGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGC CTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTATGTGACTCTGGTAACTAGAGATCCC diff --git a/util/subtype_alignments/all.fasta.nin b/util/subtype_alignments/all.fasta.nin index a4e1369..38141ba 100644 Binary files a/util/subtype_alignments/all.fasta.nin and b/util/subtype_alignments/all.fasta.nin differ diff --git a/util/subtype_alignments/all.fasta.nsq b/util/subtype_alignments/all.fasta.nsq index 57ab1d4..8a5b270 100644 Binary files a/util/subtype_alignments/all.fasta.nsq and b/util/subtype_alignments/all.fasta.nsq differ