From 775c1d18a094001ebdace50a0cd4285366c102a2 Mon Sep 17 00:00:00 2001 From: Xiao Chen Date: Thu, 6 Apr 2023 20:50:16 -0700 Subject: [PATCH] Phasing and variant calling improvements (#4) * improve phasing and handle homozygous case * better handle homozygous case * update rccx --- paraphase/__init__.py | 2 +- paraphase/data/ncf1/ncf1_config.yaml | 7 +- paraphase/data/ncf1/ref.fa | 1404 ++++++++++++++++++-------- paraphase/data/ncf1/ref.fa.fai | 2 +- paraphase/data/neb/neb_config.yaml | 2 +- paraphase/data/pms2/pms2_config.yaml | 2 +- paraphase/data/pms2/pms2_ref.fa | 1312 ++++++++++++++++-------- paraphase/data/pms2/pms2_ref.fa.fai | 2 +- paraphase/data/rccx/rccx_config.yaml | 2 - paraphase/data/strc/strc_config.yaml | 2 + paraphase/genes/cfc1_phaser.py | 5 +- paraphase/genes/f8_phaser.py | 4 +- paraphase/genes/ikbkg_phaser.py | 49 +- paraphase/genes/ncf1_phaser.py | 11 +- paraphase/genes/neb_phaser.py | 6 +- paraphase/genes/pms2_phaser.py | 11 +- paraphase/genes/rccx_phaser.py | 13 +- paraphase/genes/smn1_phaser.py | 8 +- paraphase/genes/strc_phaser.py | 68 +- paraphase/genome_depth.py | 10 +- paraphase/phaser.py | 458 +++++++-- paraphase/prepare_bam_and_vcf.py | 53 +- setup.py | 2 +- 23 files changed, 2413 insertions(+), 1022 deletions(-) diff --git a/paraphase/__init__.py b/paraphase/__init__.py index 29c8335..9aa3f90 100755 --- a/paraphase/__init__.py +++ b/paraphase/__init__.py @@ -1 +1 @@ -name = "paraphase" +__version__ = "2.1.0" diff --git a/paraphase/data/ncf1/ncf1_config.yaml b/paraphase/data/ncf1/ncf1_config.yaml index ec43783..5460521 100644 --- a/paraphase/data/ncf1/ncf1_config.yaml +++ b/paraphase/data/ncf1/ncf1_config.yaml @@ -11,14 +11,11 @@ data: coordinates: hg38: nchr: "chr7" - nchr_old: "chr7_74768800_74792800" + nchr_old: "chr7_74760000_74820000" nchr_length: 159345973 extract_region1: "chr7:74769011-74792315" extract_region2: "chr7:73215625-73238945 chr7:75153639-75176964" - pivot_site: 74777266 + pivot_site: 74777265 left_boundary: 74769011 right_boundary: 74792315 - - #mutli-alleleic site - noisy_region: [[74783765, 74783765], [74781743, 74781743], [74776715, 74776718], [74780432, 74780432], [74778377, 74778377]] \ No newline at end of file diff --git a/paraphase/data/ncf1/ref.fa b/paraphase/data/ncf1/ref.fa index cb957fc..53341c1 100644 --- a/paraphase/data/ncf1/ref.fa +++ b/paraphase/data/ncf1/ref.fa @@ -1,402 +1,1002 @@ ->chr7_74768800_74792800 -GCGGCGGGGTGCAGGGGGCCCTTCCTATTAGCACTCGGGACGTGGGGGAATTCTTGGGGC -CCTGGTATTGTTCTAACACCCAGTGATGGTTCACCAGCTGTCTCCTTTATAATAATTAGG -TAAGAGATGTGGTTTTCTACATATTTCACAATACAAACATTTTTAGAAATTCTATTTCCT -TCCCCTGAAAAAACTCTCTTATCTCTTTATTACTTCCTTCCTTAACTTTATTTTATTTTA -TTTTATTTATTTATTTTTTGAAACCAAGTCTACTCTGTTACCCAGCCTGGAGTGCAGTGG -TGTGATCTCGGCTCACTGCAACCTCTGCCTCCCAGGTTCAAGCGATTCTTCTGCCTCAGC -CTCCCAAGTAGCTGGGATTATAGGCTTGCAATGCCATGCCTGGCTAATTTTTTTATTTTT -AGTAGAGACCCGGTTTCACCGTGTTGGCCAAGCTGGTCCCGAACTCCTGACCTCAGATGA -CCCACCCACCTTGGCCTCCCAAAGTGCTGGAATTACAGGCATGAGCCACTGCACCTATCT -TTTTTTTTTTAATTAAAAAAATTATTTGGTACCTTGTTTCATCCATGCATTAAATTAAAT -CCTGGCCAGACACAGTGGCTTATGCCTGTAATCCCAGCATTTTGGGAGGCTGAGGTGGGA -GGACCACTTGATACTGGAGCTTGAGACCAGGCCGAGCAGCATCTCGAGACCCCGTCTCTA -CAAAAAAAAAATAATAATAATAATAATAATAAATAAAAAGTGGAAAAAATCCTATGTCAT -CCTGAAAAAAGGCTGTAAGCCTGCTTACAGAGGTCATTACAAGGTCAAACTCAAGTTCGG -AGCGCTTCCTGCCTCTGCTCATCCAACAAACTTGCTGGATACCTCCTGTCTGCAGAGCAC -TTTGAGGGAACATAACAGGGTCTTGGGAGGCCACAGGAGGAGAGTTGAAAGATCACAGCC -AGGGGCTCAGGGTGTCCACAGGACAAGTACCCTTGGCCAGGCAGTTACGCAAGTGTGGAA -AGACTGCTAGAGGAAGGGAAGGAAGTGCCGAGAGCCCACAAAATTCTCTGCTTACAACCA -GCCCCACTAGAACCTTCCTCTGCCCTGCCTCGACATGCCCAGGAGAGCACCGCTGCAGGT -CTGGCCTCTGTGCTGAGCCTTTTTTTTTTTTTTTTCCTGAGACAGAATCTCACTCTGCTT -CCCAGGCTGGAGTGCAGTGGCAGGATCTCGGCTCACTGCAACCTCCACCTCCCTGGTTCA -AGTGATTCTCCTGTCTTACCCTCCGGAGTAGCTGGGATTACAGGTGTGTGCCACCATGCC -CAGCTAATTTTTGTATTTTTAGTGGAGACTGGGTTTCACCATGTTGGGCCAGCTGGTCTT -GAACTCCTGACCTCAGGTGATCCGCCCACCGTAGCCTCCCAAAGTTCTGGGATTAGAGCT -ATGAGCCACCATGCCTGGCTACCGTGCTGGGCCTTTCGAGGAGGCATTTGACAGGGAAGA -TGAGAGACAAATTGAGTGTCAGGGAAGGGGTGTTGATAGAAAAATTACAGGAGAGCACAC -AACTTTCAGCGGGTGAGCCCAGTGCCTGAGCTGCGGGACCACCCTACCAATGACCTTGAA -CTTATCTGACTGCAGCCTTGAACTCCTGAGCTCAAGGAGTCCTTCTGCCTCAGCCTCCTC -CCAAGTAGCTGGGACTACTGGCACATGCCACCATGCCCAGCTAATTATTTTATTTATTTT -ATTTTATTTTATTTTATTTTATTTTATTTTGAGATGGAGTTTTGTCCTTGTTGCCCAGGC -TGGAGTGCAATGGTGCAATCTCAGCTCGCCGCAACTTCTGCCTCCCAGGTGCAAGCGAAT -TCTCCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGCATGTGCCACCACGCCTGGCTA -ATTTTGTATTTTTAGTAGAGACGGGGTTTCACCATGTTGGCCACGCTGGTCTCGAACCCC -TGACCTCAGGTGATCCACCTGCCTCGGCCTCCCAAAGTACTGAGATTACAGGCATGAGCC -ACCGCACCTGGCCCCACTTGTGGAACTAGCATCTATCTGGAGAGGAGGCAAACATCGCCC -ACCACCTCCCGCTCTCTCCTGTCACCACTGTCCCCACCATCATTCCAGAGGTCACCCTGG -CTTCCAACACCACAGCCTGGCTTGGGCAGTTTTCAAGCCTCGTATAAATGACATCCTCCA -GAACATGTGCTCTGTGCCTGCCTTCCTTCCGTCAGTGATGTATCTGGAAGATTCCACTGT -GTCGCCCTGTGGGACAGGTCCTTGTCATTGCTGAGTAGATCCTGTTGCAAATGCCTATCT -CTCTTCATGGAAAGATCCAAGATACACAGATGGAAATCATCATAGGAAGGGCTGGCAAGG -CCGTTCACACCCAGGGCTGGGGACCTCAGGGTGGAGGTGGGGGACAGTAAGGACCAGAAG -GAGCAGGTGCCGGCGGGTGATGTGAGCTTTCTTCTCTATAGAGAAGTGAAGGCCGGGTGC -AGTGGCTCACTCCTGTAATCCCAGCGCTTTGGGAGGTCGAGGCGGGCAGATCACTTGAGG -TCAGGAGTTCGAGACCAGCCTGGGCAATTTGGTGAAACCCCATCACTATAAAAATACAAA -AAATTAGCCGGACATGGTGGTGCACGCCTGTAATCCCAGCTATTTGGGAGGCTGAGGCAG -GAGAATTGCTTGTACCCGGAAGGTGAAGGTTGCAGTGAGCCGAGATCATGCCACTGCATA -CCAGCCTGGGGGACAGAAAGAGACTCTGTCTCAAAAAAAAAAAAAAGAAAAAAAGAAGTG -AAGCACTTGCCAAGCAAATCTTTCAGAGCAGGTGGAGTGGACCCTACACCTCTTGGATAA -TAAATGCACTGGATAATAAAAGCAGGAACAGGCCAGGTGCGGTGGCATGTGCCTGTAGTC -CCAACCTACTGGGGAGGCCAAGGCAGGAGGACTGCTTGAGCCCAGGAGTTGGAGGCTGCA -GTGAGTTATGACCAGGCAACTGCACTCCAGCCTGGGTGACAGATAGAGACCCTGTCTTTA -AAAAAAAAAAAAAAAAAAAAAGGGCCAAGCACAGTGGCTCATGCCTGTAATCCCAACACT -TTGGGAGGCTGAGGTGGGTGGATCTCCTGAGCTCAGGAGTTCAAGACCAGCCTGGCCAAC -AGGGTGATACCCCTTCTCTACTAAAAATACAAAATTAGCCAGGCGTGGTGGCGCACACCT -GTAATCCCAGCTACTTGGGAAGCTGAGGCAGGAGAATCGCTTGAACCTGGAAGGCAGAGG -TTGCAGTGAGCCGAGATTGTGCCACTGCACTCCAGCTTGGGCAACAAGAGCGAAACTTCG -CTTCAAACAAATAAATTAACGCCCAGCATGTCTTGGCTTTCATCTGCCAGACCTCAACCC -TCACCCCCAGGAGATCAGGTCCGGACCATGAGCTGACCCTGGACTCAGGCAAGGGTGAGT -TGGTGCAGCCCTGGCCTGCTGGGAGGCACAGGCTGCAGCAGGCTGCCTGGGGCTGAGGCC -CGCCACTCATGAACTCATGACCTTGAATGAGCTCCAAAAGCTCTGGGCCTCCCAGGCTCT -AGGGGGAGTGGGAGAGAGAGGCCTCAGCCTGTCCCTGGGCATGCTGCCCCCTCCTCACCT -CTTTGTCCCAAATCCCCTTCCTGGCAAAGCTGACAGTCTTAATATCACTCTGGAGAAAAC -TGAGTCAGCCCTAAGGAACAATTCAATGAACCATTTGCTTACTTGAGGATTGGAACTCAA -GTCTCACTCAAAGTCTGTGCCATTTTCGTCCCAGCTGTCACTGGCCCTCATCCACACACA -CCCAAGGATGAGCATCTAACGCTTGCATGCACACTCCCATGCCCGCGTTCATTCACTCAT -TCATTCATTCATTCACTCATTCATTGACTCATTCATTCATTCACTCACTCATTCATTCAC -TCAGTGAATGTTGCAGTCACGATCCAAATATTTATGGCCTCTGTGTGCCAGGCACTAGAT -GGAGGGGCTGGGGCTAGAGCCCCTGATAACCCGGTCATGCCCTAGCTTTCCTGGGACACA -CATTGTGGTAAGGGGAGACTAAAAAAATTAAGTCAGGCCAGGCACGGTGGCTCATGCCTG -AATCCCAGCACTTTGGGAGGCCGAGGCGAGTGAATTACCTGAGGTCAGGAGTTCAAGACC -AGCCTGGCCAACATGGAGAAACCCAGTCTCTAATTAAAAAAAAAAAAAATTAACCAGGTG -TGGTGGCACATGCCTGTAATCCCAGCTACTCAGGAGACTAACGCAAGAGAATTGCTTGAA -CCCAGGAGGCAGAGGTTGCGGTGAGCCGAGATCGCGCCATTGCACTCCAGCCTGGGAAAC -AAGAGCGAGACTCCATCTCAAAAAAAAAAAAGTGGGAGGCAGAGGCAGGAGGATCACTAG -AGGCCAGTAGTTTGAGACCATCCTGGGCAACATAGCAGGACCCTGTCTGTACAAAAAAAT -TAAAAAAAATTTAACCGGGCATGGTGGCACACACCCGTAGTCCCAGCTACTCCAGAGGCT -GAGGCAGGAGGATCGCTGGAGCCCAGGAGTTGGAGGCTGCAGTGAACTGTGATCCCACCA -CTGCACTTAAGCCTGGATAACAAAGCAAGACCCTGTCTCAAATAACAATAGCAATAATAA -TAAAGAAAAATTAAATGCAATTTGCGATGCATCAGTGATAAGTGCTCTGCAGAAAAAGGA -GGCAGGAAGAGGCTGAGAAAGGTATGAGGTTTGCTATGCAATGTGAAGTTATCAAGGAAG -GCTTCTCGGAAGAGGTGACATTTGAGCAGAGAAATGGAGGAGAGTTATGGAGGGAAGATG -GTGAATGGGGGGAACATGGTCAAGACCAGGAATATGGTCAAGGGGGGAAAGATGGTCAAG -GGGACGCAGCAAATGCAAAGGCCCTGAGGCAGGAGCAGCTTGATTCACCCCCAAAACCCG -TGGGGCCCGTGCAGGCGACGGGAAGGACAAGTGTAAACCCTTTTCCTTGTCCCTGCAGGT -GTGTGTGAACATGAGTCTGCCCATGTTTACACCCTGCAAGCCTGAAGAGTCCCCAGAAAC -TGAAAGAAGAAGCAAAGCCCTTTCTGTACCCTCCCTGCCCCCTGTCCCGACCGCGACAAA -AGCGACTTCCTCTTTCCAGTGCATTTAAGGCGCAGCCTGGAAGTGCCAGGGAGCACTGGA -GGCCACCCAGTCATGGGGGACACCTTCATCCGTCACATCGCCCTGCTGGGCTTTGAGAAG -CGCTTCGTACCCAGCCAGCACTATGTGAGTAGCTGGTGGAGGGCATCCCGTGGGGGGAAT -ACGGGAGGGACAGCACGGCCACCCTTGCAGTCCCAGGGCCAACCAGCTCCAGTGAGGACT -AACGGGGCAGGGTCTTGGGCACCTGGTCCCTGGTCTTTGAGCCTGGATCTACCCCTCTGA -TCCCTGGGAAGACAGTTCCCTTGGACCCGCCCTGGGCCCCAGCCCTTTACTGTCCCCGCC -TGTGTCCCCAGCCAGGCCCTCAGCCTTAGCCAGGAGTCCTCTTTCTGCTCCCCTGCCATG -GCCAGGCAGCCCAGCGCTCTCTCAGGTCCGAGGCCCACTCCTCCAGGAAGCCTTCCCTGA -CTAGCCCAGCTATCAGAGAGTGGCCCTCCCAAGAGGGAGGCCTGGAAACTAAAGCTCTCT -CTCTCCCCAGCTGCCTGTAGTGTCAGTTAGAGTCTTATCCTCTCCAGTAGGGTGACACCA -TGACAGGGGCCAATAGAGTCCTCCCATCTGTCCCCAAGGAGGCTGGACAAATGCCTGCTC -AGACACACAAGTCCACTGGGTCCCCTAATCCCATAGGAAGGCCAGGGAGGAACTACATTT -AGGAAATTGAAGCTTGTATGGAACATTTAGTCCTATGTGCCAAGACCTTTCTCTTTTTTG -TTATTTTTTTGTTTTTTGAGACAGAGTCTTGATCTGTTGCCCAGGCCAGAGTGCAGTGGC -ACGATCTCAGCTCACTGCAACCTCCGCCTTCCAGGTTCAACTGGTTCTCCTGCCTCAGCC -TCCAGAGTAGTTGGGATTACAGGTGCCCACCACCACGCCTGGCTAATTTTTGTATTTTTA -GTAGAGACAGGGTTTCACCATGTTGGCCAGACTGGTCTCAAACTCCTGACCTCAAGTGAT -CCACCCACCTGGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACCGTGCCTGGCCT -GTTTTTTTGAAATGAGGTCTGGAGTGCAGTGGTGCGATCATAGTTCACTGCAGCCTCGAC -CTCCCAGGCCCAAGTGATCCTCCTGCCTCAGCCCCTTGAGTAGCTGGGGCTACAGGCGCA -CACCACCATGCCTGGCTAGTTTTTAAAATTTTTGTGGAGATGAGGTTTCACTATGTTGTC -CAGGCTAATCTTGAACTCCTCGGCTTAAGCAACCCTCTGGTCTCAGCCTCCCACAGTGCT -AGGATTACAAGCGTGAGCTACCGTGCCTAGTCACTTTTCTCCTTTTCTTTGTAACTTTCA -GTTTTGAAATTTCAAATTTACAGAAAGGCTACTGGGTGTCAAAACGGTACCAGTCACTCC -AATAGTCTTTCACTCACCTTCATCCACACCTCTCTTTCTGGGGATATTTTCTGAATTATT -TGAGAGTGAGTTGAAGACGTGTTTCTTTACCTCTAAATACTAGTTGTTGGGCATTTCTTA -AAATCAAGGCATTCTCTTACATAATCACAACACACGTGTCAAAATCAGGAAATTAACATG -GACAAAACACCATTATCCACCCACAGACTTTACTGAGGTTTCCCCGATTATCCTGCTTGT -CCTCTGCAGTGAAAACTTTTTTCAGGTCTAGGATCCAGTCAAGGATCAATGTCATAGCCT -TTAACCTTCTTTAATCTGGATCAGTCTTTTTTCTTTTTCTTTTTCTTTTTTTGGACACGG -AATCTCACTCTGTCGCCAGACTGGAGTGCAGTGGTGCAATCTCGGCTCATTGCAACCTCT -GCCTCCTGGGTTCAAGAGATTCTCCTGCCTCAGCCTCCTGAGTAGCTGGGAATACAGGTG -CGCGCCACCATGCCCAGCTCGCATTTTTTGGTAGAGACAGGGTTTTGCCATATTGATTCT -GGATCAGTCTTTTTTTTTTTTTTATGAGATGGAGTCTTACTCTGTCACCCAGGCTGGAGT -GCAATGGCACAATCTCCACTCACTGCATCCTCCGCCTCCCAGGTTCAAGCAATTCTCGTG -CCTCAGCCTCCCGAGTAGCTGGGATTACAGGCATGCGCCACCATGCCCGGCTACTTTTTG -TATTTTTAGTAGAGACAGGGTTTCACCATGTTAGCCAGGCTGATCTCGAACTCCTGACGT -CAGGTGATCTGCCCGCCTCGACCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTG -CCAGCGGATTCTGGATCGGTCTTAATCAGTCTTTGTCTTTTGCAACTTTGATGTTTTGCA -GAGAGCAGACCAGTTACCTTGTAGAATGTCCCTTAGTTTGGGTTTATCTTCATTAGATTC -AGTTTGTGTATCCAGGGCAGTGGATCTTAGATGCAATTCTGTCTTCTTTTTAATTTTTTT -GAGAGGGAGTCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGCACAACCTCAGCTCACTG -CAGCCTCCGCCTCCCGGGTTCAAGCAATTATCCTGTCCCAGCCTCCCAAGTAGCTGGGAT -CACAGGTGCCCATCACCACTACCGGGTAATTTTTGTGTTTTTAGTAGAGACAGGGTTTCA -CCATATTGGTCAGGCTGGTCTTGAACGCCTGACCTCAGGTGATCCACCTGCCTTGGCCTC -CCAAAGTGCTGGGATTACAGACGGGAGCCAACATGCCCAGCCTTCCTGCCCCTCCCGTCC -CCTCCCCTCTCCTCCTGTCCCCTCCCTTCCCCTCCCCTCCCCACCCAAGCTGGAGTGCAG -TGGTGCAATCATAGCTCACTAAAGCCTTGACCTCCAAGTCTCAAGCAATTCTCCTGCCTC -ACCTGGGGCCACAGGTGTGCGGCACCACACCCGGACAATTTTTGTGTTTTTAGTAGATAT -GGGGGTCTCGCTATGTTGCCCAGGCTGGTCTCAAACTCTTGGACTCAAGCGATCTTCCCA -CCTCGGTACTAAAAAGTGCTGGGATTCCAGGTGTGAGCCACCGTGCCCAGCCTAGGTCCT -ACTTTTATCTCCAATTTACAGATGAGTCCATTTGAGAGAAGCTGACCCTCTTGCCCTGGG -TCTCAAGGCTGGGGCGTGGCAGCACTTGGGTCCACGTTTGTGCCCTTTCTGCAATCCAGG -ACAACCGCAAAGATGGTCCTCACCCCAATCCTCTGGGCTTCCTCCAGTGGGTAGTGGGAT -CCTGGGTGCACACAGCAAAGCCTCTTTGGAGGCTGAATGGGGTCCCCCGACTCTGGCTTT -CCCCCAGGTGTACATGTTCCTGGTGAAATGGCAGGACCTGTCGGAGAAGGTGGTCTACCG -GCGCTTCACCGAGATCTACGAGTTCCATGTGAGTGTGGGGATGGAGGAGGGACAGGGACC -CACCGTTCCAGCTCCACCCTTTGGGAAGGACCTTAGCCCAGGTGATGGGGAAACTGCAGA -ACCCAGAATCCCCTCCCAGACCACAGTTAAAGGGGATTTATTTATTTATATAAATTTTTG -TGACAGGGTCTTGCTCTGTCACCACTCTGAACACCTCATGTTCTCTGATTACAGGCATGA -GCCCCCACGCTCGGCCTTTTAGGTGGTTTTGAGAGGTATTTAGGTTTGCAGTGCAGGGGC -GCAATCATAGCTCACTGCAGCCTCGACCTCTGGGGCTCAAGCGATCCTCCTGCCTCAGCC -TCCTGAGTAGCTGGGACTATAGGTGCGCATCACCATGTGTGGCTAATTTTTGTATTTTTT -ATAAAGATGGGGATCTCACTATGTTGCCCAGGCTGGTCTTGAACTCCAGACCTCAAGTGA -TCCTCCTGCCTTGGCCTCCCAAAGCTAAGGGGGCATTAAAAGAAAAAAACATTTTTCCCC -CTGAAACATTTAAGTAGTCTTACTGAAAACAATAAAACACAGAAACACCAGATTCTCATT -TTAAAGTAAAACAGACAGGATCTCCCAGAACCTTCCTAGAATGGAACCATTCTTGTCGCT -TTTGAAAAACAAAGCCAAGTTCTAGATCCCAAATAAATGCACCTGCTGGTGAACATTCTC -CTTGTGGTTCTCGTCCCTATGTTAGTTATTTTCCTAAATTTTACATTTGTACCTTTTTAA -GAATGAGTTATCAGTTTTTTTATATTTGCTTTTCTTTTGAGATGGGGTCTTGCTCTGTCA -CCCAGGCTGGGGTGCAGTGGTGCAATCACGGCTCACTGCAGCCTCAACCTCCAGGGCTGA -AGCGATTCTCCCATCTCAGCCTCCCATGTTGAGATCACAGGTGTGCACCACCACACCTGG -CTCCTTTTCCTGATTTGTTTTTTGTAGAGATGGGATTTCGCTATGTTGCCCAGGCTGGTC -TCTAACTCCTGGACTCAAGTGATCCTCCCGCCTCAGCCTCCCAAATTGCTAGGATTACAG -GTTTGAGCCCCTGCACCTGGTCAACCTGAGTTTTAAGAGGATCCCTTTGGCGACTGGATT -GAGGACAGACAAGAGTGGACGGGGGACACAAGGAGGCCATTTTCGTTATCCAGGCCTGGT -AGTGGCTAGGGCCAGGAGGGTGGGGTTGGTGGGAAGCAGTCAGATCCCAAAGAGATTTGG -GGATTGGAAGCAAAAGGATTTGCTGGTGACTTGCACATGGGAGGGAGAGAGGTCAGTGCC -TCTGCTAATCAAGGAATCCAGATTGCCACCGAAATTTCTAGGCCCGAGATATTTAGGTAG -TGTCTCACTCTGTCACCCAGGATGGAGTGCAGTGGCACCATCTCGGCTCACTGTAACCTC -CGCCTCCCAGGTTTAAGCGATTCTCCCACCTCAGCCTCCTGAGTAGCTGGGATTACAGGC -ATGTGCCACCACTCCCGGCTAATTTTTGTATTTTTAGTAGAGACGGGGTTTCACCACGTT -GGCCAGGCTGGTCTTGAACTCCTGACCTCAAGTGATCCACCCACGACAGCCTCCCAAAGT -GCTGGGATTACAGGCGTGAGCCACCATGCTCGGCCTTTTAGGTGGTTTTGAGAGGTATTT -AGGTCACTTCCAATCTCGTGCTTTTCCAAGTGTTGTAAACTACAAATATTCCTTCACGTC -TTCTTGTCTTTTTAATGTTTAGAAAACCTTAAAAGAAATGTTCCCTATTGAGGCAGGGGC -GATCAATCCAGAGAACAGGATCATCCCCCACCTCCCAGGTGAGCACGGGGCTGAGCCGCC -TGTCAGGGGGTCATTGGCGGGGGCTCACCTGCCCTCCCAGCCCCTCTCGGGCTTGACCTC -ATGTTCTCTGGTGCCAGCTCCCAAGTGGTTTGACGGGCAGCGGGCCGCCGAGAACCGCCA -GGGCACACTTACCGAGTACTGCAGCACGCTCATGAGCCTGCCCACCAAGATCTCCCGCTG -TCCCCACCTCCTCGACTTCTTCAAGGTGCGCCCTGATGACCTCAAGCTCCCCACGGACAA -CCAGTGAGTGAACTTTTCACCCTGCCAGGTGGGAGAGGGAAGGAGGGGTGGGACTTTCTG -TGTTTTGCAGATGAGGAAACCAAGGCTCAGAGAGGGAAAGCCACCTTCCCAGAGCCACAC -AGCCAGAAAGAGGAGGCAAATTCCACCTCCGGCCCCTGTGACCCCGCCAAGCCTCCACCT -TAATCTTTCACACCTCAGGGCACTGGGGGAAGCACTCGGGGCTGGAGGTTCAAAGTCCTG -GGTCCTCATCCTGACATTATGGCCACCTGGCCATGGGACCTGGAGCCAGTCACCACTGCT -CTCTGAATGCAGGTTCTCCATTTCTATAATGGGCAGTGAGGATCAGATGAAGCATTGGGT -GTCTTGCGGAGCCCCCCAGAAGGATGTGGGGTTGATGCCTCTGCTAAGTGCTGAGCATGT -CTGGGGTCTCCTGTACCCAGGACCCTGTGTGGAAGGCACCTGAGAGGCTGAGGGAGCTCC -AGGCAGGCTGGGGAAGTCCCCTTCTCCACTCCTCTCTGGTCACTGAAGCTCGAAGTGGGG -AGCATGAGGACAGGACGTTACCCCTTGTCAAGGCACCCAGGCTGCCAAGACAGAGACAAG -CAGCATTGCTCCGGCCAGCACTTATTGACGCTTGAAGGTGTCCCCTGGCCCAAGGAAGGG -CAGTTATCATCAGCCCGGGAGGCGGGGGAAGGATGGACTCTGCAGTGGGGTCCGCTCCTC -ATTGCCTGCTCTCTCAGGGCTCCAGAAGGAGGAAGAGGCCGGGCACAGTGGCTCACACGT -ATAATCCCAGCACTTTGGAAGGTCGAGGTGGGCAGATCACCTGAGGTTGGGAGTTTGAGA -CCAGCCTGGCCAACATGGTGAAACCCCATCTCTACCAAAAATATAAAAATTTAGTCAGGC -ATGGTGGTGTGCGCTTGTAATCCCAGCTACTTGGGAGGCCGAGGCAGGAGAATCGCTTGA -ACCCGGGAGGCAGAGGTTGCAGTGAGCTGAGACTGCGCCACTGCACTCCAGCCTGGGTGA -CAGAGCGAGACTCTGTCTAAGAAAAAAAAAAGAAAAGAAGAAAGAAGATGGCCTGGGAGC -CCGCAAGAGCATTTTCCAGGCTTAGGGCATCCTTTGGGTCTGCAGAAGGCTATGCAGTGT -CCTCCTCATGTCCCTCCCTTGGGCTGCCCGAGCAGATCCGCCCGCCCCCATCACTTCCTG -AAGCCCTTCCTCAGCCAGTCCAGTTGCTGTCTTCTCTCCGCAGTGCCCCTTCCCTTTCCC -GGGTCCCTCTTCTCTTGGGAAGTTCTTCTGCAGGTCTACCCAGTGCCTCTTCTTCCTCCA -TGGGAAGCCAAGGGTCTCACCCAGACTGTTCTCTCCTCAGGACAAAAAAGCCAGAGACAT -ACTTGATGCCCAAAGATGGCAAGAGTACCGCGACAGGTGAGAGGACGGGGGGCAGCCGGC -GGGGGGGGACACCCTGAGGAGACCCAGAGTGTTCAGGGAATGGAGCAGGGGCTGGGAGCA -GGCTGGGAGGGCTCACAGCTACCCTGCTGAAGAATTGGGTCTTTGGGCCGGGTGCGGTTG -CTCATGCCTGTAATCCCAGCAGTTTGGGAGGCCGAGGCAGGTGGATCACTTGAGGTCAGG -AGTTTGAGACCAGCCTGGCCAACATGGAGAAACCCTGTCTCTACTAAAAATCCAAATTAG -CCAGGCGTGGTGACAGGTGCCTGTAGTCCCAGCCACTTGGGAGGCTGAGGCAGGAGAATT -GCTTGAACCCGGAAGACGGAGTTTGCAGTGAGCCGAGATCGTGCCACTGCACTCCAGCCT -GGGCAGCAGAGCCAGACTCCATCTCAAAAAAAAAAAAAAAAAAAAAGAAGAATTGGGTCT -TTGGAAGGTCCCTGGAGACTGAAAGGAGCCCTTTGCAGGTGGCAGTGCAGAGACCAGCGC -AGACCCTTGCTACTGGCAGCCGGGGGAGTGTTTGCGGCTGAATGAATGAACAGGTTTTGG -AGGGCAGTGTGGCCTTCAGAGGCGATGCAGGGCTGTGGCAGTTTCTAATACTTATTGCAC -AGTCACTGCTAATAACAATAATAATAATAATACCTAACATTAATGGAGTGCTTACTCTGT -GCCAGCCACTATTTTGTTTTTGTTGTTTTCAGTGACAGGGTCTCGCTCTGTTGCCCAGGC -TAGAGTGAAGTGGTGTGATCATAGCTCACTACAGCCTCGACCTCCTGGGCTGAAGCGATC -CTCCCACCTCAGCCTCCCAAGTAGCTGGGATTACAGGTGTGTGCCACCATGTCCAGCTAA -TTTTTAATTTTCTGGTAGAGATGGGGTCTCACTACATTGCCCAAGCTGGTCTTAAGCTCT -TGGCCTCAAGCAACCCTCCTGCCTCAGCCTCCCAAAGTGCTGAGATTATAGACATGAGCC -ACTGTGCCCGGCTTTTTCTTCTTCTTATAAGGACACGAGGCCTGTTGGGTTAGGGCCCAC -TCTACTGACCTCATTTTAATTTAATTACCTCTTGAAACGTACTTAAGAGTACCTTTCTCT -TAATACACCCACACTGTAAGGTACTGGGTGGTTAGGACTTCAACATATGAATTTTGAGAA -GGCGGATGTCAGCCAATACTAAACAGCATCAGCACCTCCACGGTTGGATGAAGGGCTGGT -CAGAAATGCACACTCAGGTCCCACAGTGGACCTACTGAACAGGATAGGCATTTTAGCAAA -ATCCCAGGTATTCGGGTGCACCTTAAAGTTAGGAAAAGGTCAGGCACTGTGGCTCATGCC -TGTAATCCCAGCACTTTGGGAGGCCGAGGCGGTTGAATCACCTGAGGTCAGGAGTTCGAG -ACCAGCCTGACCAATATCGTGAAACTCCATCTCTACTAAAAATACAAAAATTAGCCAGGT -GTGGTGGCGGGTGCTTGTAGTCCCAGCTACTTGGGAGGCTGAGGCAGGTGAATTACTTGA -ACCTGGGAGGTGGAGGTTGCAATGAGCCAAGATTGCACCACTGCACTCCAGTGACAGAGC -GAGACTCCATCTCAAAAAAAAAAAAAAAAAAGTTGGGAAAAGGCCAGGTGCAGTGGCTCC -ACACCTGTAATCCCAACACTTTAAGAGGCTGAGGTGGGAGAATCCTTTGAGCCCAGGAGT -TCGAGACCAGCCTGGGCATTGTCCCAAGACCTTGTCTTTACAAAAAATTAGCCGGGTGTG -GTGGCATACGTCTATGGTCCCAGCTATTCGGGAGGCTGAGGCAGGGAGATTGCTTGAGCC -TAGGAGTCCAGGGCTGTAGTGAGCTGTGATCACGTCACTGTACTCTAGCCTGGGCAACAG -AGCAAGACTCTGTCTCCAAAAAAGAAAATAAAGTTGGGAAAGGCTCACTAACTTCATCAG -ATGAGAACAAGGACATGTTTGAAGTGTGAGGCCGAAGCCTGGAGAACGCTATGCGCCCAG -GAAATGCAGGGCAGCAGAGACTCAAGATGCCAGCGCCTGTTCTGGAGGCCCAGATGGGCC -CTGCAATGCCCACTCACCCTGCCCTCCCTCTTGCCCCAGACATCACCGGCCCCATCATCC -TGCAGACGTACCGCGCCATTGCCAACTACGAGAAGACCTCGGGCTCCGAGATGGCTCTGT -CCACGGGGGACGTGGTGGAGGTCGTAGAGAAGAGCGAGAGCGGTCAGACCTCCCACCTTA -CGGGGCTCCTTCCCCTGGTGCTCAGGAACCCACAGCCACAAGCCCCCTGCCAAGGCTCAG -GCAGCCTTGCCCCTGGGAGGACTCCGGCTCTGTTAGGGGCCCTAAATGTCCTCCCCACAC -TGTGGGTCGCCTTCTGTCTTAGTGTGCACCCTGTGGTGGCTGTGGGCATCTGTGCATGGC -AGGCCGGGGCGGGGCATGTCTGCGTGTTCTGTCTGGATGGGTATGGGACCGTCTGTTCAT -TATGAAGTGGGCTCAGAGCTGTGATTCTGTGAGCATGTGTGCATGCATGCATGTGACCTC -ATTGTCCAGTGTGGTGAAGGTGACATTTCCAAATCTGAGCATTGGACATCAGTGTGTCTG -TGTCCCTGTGTCCTCACCATCCCTGATGGCTGCAGGGAGCCGCTGGGCCCTGCCCCTCAG -TCACATTCCCGCACCTCTGGCACAGGTTGGTGGTTCTGTCAGATGAAAGCAAAGCGAGGC -TGGATCCCAGCGTCCTTCCTCGAGCCCCTGGACAGTCCTGACGAGACGGAAGACCCTGAG -CCCAACTATGCAGGTGCCCCCTGCCCTCCGAGGCTGTAGGGGTGTGGGAGAAAGGGGCAG -GCAGGGCTCAGGGATATTGAGTGACTGCTTTGGAGTCTGGGCTGGTTGCTGGCTTGGCAG -AAAAGTCAGGGCTAAGATCTCATCGACTCTGGCTTGGGGGCCCTGGCAGGTTGTGATGCC -CTTGGTCTGGACAGGGAACCAGGAGGAGGAGCAGACGACTGGGGAGAGTGGGAGGCCAGT -GGTGTCTGTGGATATGTGGCCAGGTTCAGTGGGAAGCTGAAGGATGAGCAGACCTTAGGC -TCAGGAAGGAGGGCTGCCTGGAAGTGGGGGCATCATCACTGACCAGAAAGGGAAAACTGG -CAGTGCCAGGGCTGGATGGGGCCTGCATTGAGCTTGAAAAAAACTATAATAGAATTGGTT -ACCATTTTATTTTATTATTTATTTATTTATTTTACTTTTTTGAGATAGAGTCTCACTCCC -TTGCTAAGGCTGGAGTGCGGTGGTGCTATCTCAGCTCACTGCAACCTCTGCCTCCCAGGA -TCAAGTGATTCTCCAGCCTCAGCCTCCCCAAGTAGCTGGGATTACAAGCATGCACCACCA -TGCCTGGATAATTTTTGTATTTTTAGTTGAGACGGGGTTTCACCAGGTTGGCCAGACTGG -TCTCGAACTTCTGACCTCAGGTGATCTGCCTGCCTTGGCCTCCCAAAGTGCTGGAATTAC -AGATGTGAGCCACTGTCCCTGGCCTGGTTACCCACATTTTAAAATGGAGTGATTTCACCC -TTTTATGTGGATTTACAGCTTTTTTTTTTTTTTTTGAGACAAAGTCTGGCTCTGTCACCC -AGGCTGGAGTGCAGTAATGCAATCTCAGCTCACTGCAACCTTAGCCTCCTGGGTTCAAGC -AATTCTCCTGCCTCAGCCACCTGAGTAGCTGGGATTACAGGCATGCACCACCACGCCAGG -CTAATTTTTTGTATTTTTAGTAGAGATGGGGTTTCGCCATGTTGGCCAGGCTGGTCTCGA -ACTCCTGACCTCAGGTGATCCGCCCGCCTTGGCCTCCCAAAGTGCTAGGATTACAGGTGG -GAACCACCTTGCCCAGCCTGTGGCTATCGTTTAAACACTGGGAAGGCCTGCAGCCCCCAG -GCCGACAGTTAGCTGCAGCTGAGCAGTTCCCAGTGCCAGGTAGACGGATGCTCCACCCAC -CTACTCATGGCTGATCTCTTGTCATAGTGAAGTGTCTGGACAGACCTTCATCGTTATGGG -ATCTCTGGTCCCCAGAGTGGGTGGCAATGAATGGGAGTGGACAAGCTCACCTGGGTGTAG -GGGGCAGAGGGCCGAAGTCCAGAGTGTACCCCCAGAGTGGGTGCCAGCAGGAGCTTGCCG -AGGGATCTGGGATGGAGCAGGAGGGTGGAGGGAGGAGACCCAGAAGAGGGGGAACTGTGG -GCCCTGGGTGGGTCTGGAGTGCCTGGAGGAAGCCCAGGCGCAGAGAGGAGAAGATGGGAT -GGGTGGCGAGCCCCAGGCTGGGCCGACCTCACACTGTGCTCTGTGCCCCTGCCGTGGACC -AGGTGAGCCATACGTCGCCATCAAGGCCTACACTGCTGTGGAGGGGGACGAGGTGTCCCT -GCTCGAGGGTGAAGCTGTTGAGGTCATTCACAAGCTCCTGGACGGCTGGTGGGTCATCAG -GTAGGAGGGCCCCTCTCCATCCAGAGCACCCATCTGAGTCAGCCCCAGCCAGGACGGGGT -GTTTAGGGATCTGGGGTGACTTGTCCCTGGGACTCTGGGTAAGCCACTGCCCCTCTCTGG -GCTTAGTTTCCATCTCAGTAGCAGGGAGGAATGAGCCCACCCTTGCCTGTCTTGTGGGGA -TCCAATGTCCTTGTCCAAGTGGGTGCATTTCTCCTTTGTGATTTAGGGTCTCTTCCCAAC -CATCTATTATTATTCCTTCTCTGGCAACATGGTGAACTGTTGTATAAATAATTACATTCC -TAGCTAGGCGCAATGGCTCAGGCCTGTAATCCCAGCACTTTGGGAGCCCAGGACAGGACG -ATCATGTGAGGTCAGGAGTTCGAGACCACCCTGGCCAACATGGCAAAACCCTATCTCTAC -TAAAAACACAAACATGAGCCGGGTGTGGTGGTGGGAGCCTGTAATCCCAGCTACTCGGGA -GTCTGAGACAAGAGAATCACTTCAACCCGGGAGGCGGAGGTTGCAGTGAGCCAAGATCGC -GCCATTGCACTCCAGCCTGGGCAACGAGAGCGAAACTCCGTCTCAAAAAAAAAAAAAAAA -AAAAAGATTACTTTCTTTTTATCATTCCTTTATCTTTTAAAGCTTTCTTGCAGTCAGGTG -CAGTGTCTCATGCCTGTAATCCCAACACTTTGGGAAGCTGAGGTGGGAGGATCACTCAAG -GCTACAAGTTCAAGACCAACCTGGGCAATGTAGGGAGACCTCTGTCTCTACAAAAAAAAT -TAAAAAATAGCTGGATGTGGTAGCACACACCTGTAGCCCCAGCTACTCAGGAGGCTGAGG -TGAAAGGATCACTTGACCCCAGGAGTTGGAGGCTGCAGTGAGCTATGACTGCACCACTGC -ACCCCAGCCTGGGTGATGGAGCAAGACCCTGTCTCAAAAAAAAAAAAAAAAAAAAAGCTT -CCATTGCAATTCCCATCTGTTTATCCTCCAAATGAATGCAGAAATACTAATTATCTTTTT -TCTGGTTCTGGGGAACACAGAATTCTAGCGGCTTGTGGAGCCATTTCCCTGGAGCCATGG -GGCCTCCCAGGTCCTTTCCTGTGTCTTCATTTTTTACGAATTTTTTCATTTTTTGAGACA -GGATCTTGCTCTGACTCCCAAGCTGGAGCACAATCATCGCTCACTCAAGCGATCCTCCCA -CCTCAGGCTCCCACGTAGCTGGGACTACAGGTGAGCACCACCACATCTGGCTAATGTTTT -TTAATTTTTTTGTAGGGATGGGGTCTCACTATGGTGCCAAGACTAGTCTTAAACTCCTGG -CCTCAAGAGTTCCTCCTGCCTTGGCCTCCCAAAGCACTGGGATTACAGGAATGAGCCTCC -ATGCTGGGCCTTTGCTGGCGTCTTCAGAGCCCTAGGTCACAGGGCCAGCCTGGCGCCCTG -CCGCAAGCTTATCTTAAAGCTGGGACCACAACATGCATACCTGCAGCCGGGCCCGGGGCC -AGAGGGCTTTGAGGCAGCATTTCTCAGCCTTTTAGACACACACTCTGTTAACCCCCATCC -TGTGTCTCTGATAATCTTCTTGTGATCCTCCCACCAGCCAAGAATTGGGTTTTATGTGAA -CCTTGTATTATGCAAAGTTTTCTTTTGTTTTTTTTTTCACTCCCAAATATAATATTGAGA -ATAGAAAGAAAGTCTTTTCAACAAATGGTGCTGGAACAGATGGATTTCCATACTGGAAAA -AAAAAAAAAAGAGCAAAAAACAAACCTAGACCCCTTCCTCACACTGTACACATATGTTTA -CTTCAGATGGATCACAGGTTTATCCCAGAGTAAAACCTGAAACTAAAAACCATTTGGGGC -TGGACAGGGAGCTCACGCCTGTAATCTCAGCACTTTGGGAGGCTGAGGCAGGTGGATCAC -TTGATGTCAGGAGTTTGAGACCAGCCATGACCAACATGGTGAAATCCTGTCTCTACTAAA -AAAATACAAAATTAACCAAGTGTGGTGGTGCATGCCTGTAATCCCAGCTACTTGGGAAGC -TGAGACAGGAGAATTGCTTGAACTTGGGAAGCAGAGGTTGCAATGAGTCGACATCATGCC -ATTGCACTCCAGCCTAGGCAACAAGAGCAAAACTCTGTCTTGGGGTTGGGCGGGGGAAAA -GCATTTGGAAGAAAGCATAGAATTTGGTGGCTTGGAGGTAGGCAAAGGTTCGTAGGAGAC -AGAAGGCAGTTAACATAAAAGAAAAATTGGCAAATATAATCCGCCAATGTCTTCTTTTTT -CTTTACTTTTTTCGGGAGGTAGAGATAGGGGTCTTGCTATGTTACCCAGGCTGATCTCCA -ACTCCTGGCCTCAAGCGATCCTCCCACCTAGATCCCTCAAAGTACTGGGATTACAGGCGT -GAGCGACCGTGCCCTGCCCATTCTTGCCAATGTCTTATAGCAAATACCTGTCCCCTGCGG -TGACCTGGATCTGCTAACCTCCACCCCTGCCTAGACTGTGGAAGGATTGCTGGAAGGGTC -TCAGTTGCACAGACCAGGAAACTGAGGCCCACAGAGGCAGGTGTCCGGTTGTTTGCAACC -TCTCAGCCTGTGCTAACCCCAATTGTTCAGAGAGAGCCCTGAAACCCTCTCCTCTGGGCG -CCCCCAGGTGACTGCCCCAGCCTCAAGGGCTGCCTCTGTTGCAGGAAAGACGACGTCACA -GGCTACTTCCCGTCCATGTACCTGCAAAAGTCAGGGCAAGACGTGTCCCAGGCCCAACGC -CAGATCAAGCGGGGGGCGCCGCCCCGCAGGTAAGCGGGGGTCCCCGGGGCTGGGCGGGGT -CGAGCGGGGCGCACCACGGGTTCGCTCTGTCTAGGCCATAGCTTGGCAGTGCCGGGGCGG -GGGCTCTCAGCCTGGCAGGAGAGGCAGGACCCTCACGGGGGAAAGGGGCTGGACGCGCCT -GGCCGCGGTGTGGGGCTGGCACGGGGGCGGAAGGAAAGCGGCGATGCCCGGGGGCTTTGG -GGATGGGCAGTCCAGGGGGGGTCCCCGGAGAGGGGGACGACAGACCGAAGGCTGGTGAGG -GGCGTGGAAAACCGCCCAGGCTCTGCTGCAGGGCAAGGGTCCTTGTCGTGACGGGGGCAG -CCGCCTCTTGTCCCGCCGGGGTCGTGCAGACTACCGGCCCCCTACTGCCCCCCACTTCCT -CGGACCAGGGGTGCCCATCTGAGTCCCTGGGGGCAGGGGCGCCCTCGGGCTTTGACGACG -CCCCGTCCCGCTGGGCCAGGTCGTCCATCCGCAACGCGCACAGCATCCACCAGCGGTCGC -GGAAGCGCCTCAGCCAGGACGCCTATCGCCGCAACAGCGTCCGTTTTCTGCAGCAGCGAC -GCCGCCAGGCGCGGCCGGGACCGCAGAGCCCCGGGAGCCCGCTCGGTGAGTGCAGCGGGA -GAGGGCAGGAAGGGCAAGCCCTAGAGGCGGAGTCAGCGGGAGAGGCGGGGCCAGAGGTAG -GGCCAGAGTAGCGGGGCGGGACCAGAGGGCGGAATCAGAGGGAGAGGCGGGGACTGGAGG -CGGGGTCAGAGGAGGAGCCAGCGCTAGGGGGCGGAGCGATCCCTAAGAGGCGGAGTCAGA -GGGAGAGGCACAAGCGGGAGGCGAGGCCAGAGCGCGGAGCAGGAGTTGGAGACCGCGGCG -GGGCGAGGCCAGAGAGCGCTGTGGGCGGGGCCAGTGTGCGGGGCGGGGCGTCTGACTCGG -CCCCGCTCTCTGCCCGCAGAGGAGGAGCGGCAGACGCAGCGCTCTAAACCGCAGCCGGCG -GTGCCCCCGCGGCCGAGCGCCGACCTCATCCTGAACCGCTGCAGCGAGAGCACCAAGCGG -AAGCTGGCGTCTGCCGTCTGAGGCTGGAGCGCAGTCCCCAGCTAGCGTCTCGGCCCTTGC -CGCCCCGTGCCTGTATATACGTGTTCTATAGAGCCTGGCGTCTGGACGCCGAGGGCAGCC -CCGACCCCTGTCCAGCGCGGCTCCCGCCACCCTCAATAAATGTTGCTTGGAGTGGACCGA -GGCTCTGCAGGAATGCAGGGAGGGCCGGGCTCCGCCCCAGGGTTATTTCTAAGTTGAGGA -CAGGAGGTTGTGAGTTCTGCTGGGGGGAAGTTGCAAGAGCCGAGGTCTGGTTGCATGTTG -CCCTGGTCTTGGCCAAGAACAGGTTTGCACAAGGCCAAGTTCAAGAGGAACTCCCGGTTT -CCTGCTGACCGTTTGGTCAGAAACCACCTGCTTGGACTCTGGCGGAAGAGTGCTGAAGAT -GGGTGCACACAGTGCAGCAGGGCAGCCCTGTCTCATGACAGGAGACAGGCTGCCGTCCAG -GGTGTAGGAGTGACCTCATAGCTGGGATAAAAAATATATTATAACTTAGGTTCGGGCGCG -GTGGCTCACGCCTGTAACCCAGCACTTTGGGAGACCGAGGTGGGAGGATCCGTTGAGCTC -AGGAGTTCGAGACCAGCCTGGCCAACATGGTGAAACCCCATCTCTACCAAAAATATAAAA -ATTAGCTGGGCGTGGTGGCATGCATCCATAATCCCAGCTACTGGGGAGGCTGAGGCATGA -GAATCGCTTGAACCGGGGAGGCAGATGTTGCAGTGAGCCGAGACGGCGCCACTGGACTCC -AGCCTGGACAACATGGTGAAACCCCATCTGTACCAAAAATATAAAAATTAGCTGGGCGTG -GTGGCATGCATCCACAATCCCAGCTACTGGGGAGGCTGAGGCATGAGAATCGCTTGAACC -GGGGAGGCAGATGTTGCAGTGAGCCGAGACGGCGCCACTGCACTCCAGCCTGGACTACAG -AGCGAGACTCTAGCTCAAAAAAAAAAAAAAAAAAAAGTAACTTAGGTGCAGGGTGTCCTC -TGTTATTCACTGAGACCGTGCCCCGGTTATGAGGTTGTACCAGAAAGCAAGTATTCACTA -TGCACACTATTCACCGCTCACCCTAGCATTGAAGCCAGCCTGTAGCCTGAAAGCCTTTGC -TTTGAGGGCAGGTCTTTCCCCAAAATGCAGACACGAAGGTGCAAAGTGAAGCTGCCAGTC -TTGCAAAAGATGTAACTTGTCACGAAGGCCACGAGTGGCAGGGAGAGCTGTCCCACATTT -GCGGAAGTGGCTATGTGAGGACGGGGGAGGCGGGTCCCTTAGAGATAAGAGACAATCATA -AGGGGAGATATCAGAGAAAATCGTAAGGGGAGCAGATGGTTGTCAAGAGAATAGGCTGAC -CATCGAAGGACTGGCAGAAGCTTTCAGAAAACCACTGGACGGCTGGGCACAGTGGCTTAG -GCCTGTAATCCCAGCACTTTGGGAGGCTGACGCGGGTGAATCACTTGAGGTCAGGAGTTC -CAGACCAGCCTGGCCAACATGGTGAAACCCCATCTCTACAGAAAATATAAAAATTAGCCA -GGCGTGGTGGCACAAGCCTAGAATCCCAGCTACTTGGGAGGCTGAGGCAGGCGAATGGCT -TGAACCCAGGAGTCAGAGGCTGCAGTGAGTCGAGAGTGTTCCACTGCACTCCAGCCTGGG -TGACAGTGCAAGACTCCTTCCAAAAAAAAAAAAAGAAGAAAAAAGAAAACCACTGCAGCT -CTAAACTAGTTCTGCATTTTTGCCGAACCTGGTTTGCTGGAAAAGCCCAGCACCAAAGGC -TATCATACAAAGCTGTGGGAAATTGAATCACCAACCTCACCCCTTCTGCTTGTTCAGTTG -CAGTTATAACCCTTTTATTAAATACAGTATAAAATACCACGCCTCTAATCCGAGTGCTCT -GGGAGGCCAAGGTGGAAGGATTGCTTGGGGCAGGGAGTTCAAGACCAGCCTGGGCCACAC -GGTGAGACCCATCTAGACAAACATTTTTAAAAATTAGACAGGTGTGGTGGTGTGCACCTG -TAGTCCCAGGCTGGGTGGGAGGATCGCTTGAGCCCAGGAGTTTGAGGCTGCAGTAAGCTG -TGATCGTGCCACTGTACTTCAGCCTGGGTGACAGAGCAAGACCCTGTCTCTAAAAAAAAA -ACAAATTAAGGCCAGCCACAATGTTTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAG -GCAGGCGGATGACTTGAGGCCAGGAGTTCGAGACCAGCTTGGCCAACATGGTGAAAGCTT -GTCTCTGCTAAAAATACAACAACAACAACAAAATTAGCCGGGTGTGGTGGTACACGTCTG -TAATCCCAGGTACTCAGGAGGCTGAGGCGGAAGAATCACTTGAACCCGGGAGGCAGAGGT -TACAGTGAGCCGAGATCACGCCACCACACTCCAGCCTGGGCGACAGAGCATGACTCTGTC -TCAAAAATAAATAAATAAATAAATAAAAATAAAAAAATACATACATATAAAAAAGAAGAG -AAAATACTTATTTTCATGATTGTTTCATTTTTTTCCAAGCTGAGGTCCTGACCAAATGTT -TCCCCGTGGTTTTTGTATATTTCTGATCCCCTTAAAGTGGCCCTTGCAGCGTGCTGGGGA -GGAGGCCTCTCGGTGGGTGGGTGATTGGGAAGCCACGCCCACAGGGAAGGGAGAAAAAAA -CTGAAGTTGCCTGCTCTAAGGGCTGCACCTCTGTTTAGCCAACAATTTTCTTGAGGCCAG -TCATAGTGCTGGGCTCATTCCATCATCTCCAGTTCTGAGACCAACACTGTCTGGTAGGTG -TTTTATGGATGAGGAAACCAAAGCTCATAAAATTAATTAAGTGGTTTGCTTATGAAATAA -TGCAAGAAAGCAACAGTGCTGGGAGGTGGAACCGGGTTTTTCTTTTCTTCTTCTTTTTTT -TTTTTTTGATGGAGTTTCGCTCTTGTCACCCAGGTGGAGTACAATGGAGCGACCTCAGCT -CACTGCAACCTCTGCCTCCCGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCGAGTAGCT -GGGATTACAGGTGCCCGCCACCCTGCCCAGCTAATTTTTTGTATTTTTAGTAGAGATGAG -GTTTCACCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCAGGTAATCCGCCTGCCTT -GGCCTTCCAAAGTGGTGGGATTACAGGCATGAGCCACTGCGGCTGGCCCAGGCTTTTCTT -TTTGATTCTAAGGCCTTCCAGATCCAGTACTTTATCCTGACCCTGCAGAGCTCAGGATCT -GTGGTTCAGGCCTGCGGCTCAGAGGAGGGAATACGGCACACAGGTACGTGCCAGGCCAAG -TGTGAGGGGGTCTGGCTTCCAGGGCCCTCTGCAGACCCCTAGTCCCAGGGCCTGTGTTGG -AGGAGAGATTGGCTCTTTCCTCTGCCCATCCTGGGATGAGAAGTCGGGGACTTGGGATAG -ATGCAGTGCAATCCCTGCCCCTGAAAATTGACAAAGACCCACCAAATCTAGCCCCTACTC -CTAGGCTGGGCCCCTGCCCATCTCCCTGGACCACACCACTCTCAAGGGCTCTCGTTTGCA -GACACCCCATTGCCCTACTAAAAACCTCTCCTGGCCAGGCTTGGTGGCTCACGCCTGTAA -T +>chr7_74760000_74820000 +TCCTTAATGACTGAGTGAACAGTTCCTATCTGTATATTTGACTAAACCTTTTCCTAAGCT +ATCTCTCATGGTTCCTATGTTTTTTTATCATAATTAAAAGCAAAACCATCTGGATCACCT +AACAGTCAGAGGTCAGTATCTCAGCGTGTGAATTATAGAGGAAATACAGAGAGAACCTCT +TCCACTTTTACTTTTCGTCCAAATAAAATGCATGGTGTACCAGAAGTTGAAGATCGGGTT +GAGGATTGGGGCTAGCTCGATGACACTAAGGCCCCAACATCGCGGGACCTGCTGTGGCGC +GGATTCTTAGGAACGCTGTTCTAGCCGGCCCCCTCTCCAGGGGTCGCCGTGGCCGGCATT +ATTTCCTAGTTCTTCTTGTAACCCTGAGGTGCCAGCGCGGGGAGTGAGGAGGGGTCAGGG +GGCTAAGGATGCAACCTCTGACGTTCTGCGCCTTCCTAGGAGAGTCTTACATGTGTTGAG +ATTTCACAAGCAATGCGAGTTGTAAAATACCAGCTCTACAAGAAGCTAGGCTCTGTGACG +GCATAGTTTTCAGTAGCTTTATCACAATATTCACAATGGAGAATTATATGACATGGTAGC +AGAAATAGGCCCTTTTATGTGTTGCTTCTATTTTACCTCAAATTGTAGATATAGGGTAAT +CAATAAAATCCATCCATGCCTTTCACACACTAAGTCATTGCTCTCTCGGCTGTTTTCATG +GTCCTGTCTGGGGAAGCTTGGGGGTGGCTCGGCGTAGGTGGGACGCAGACCAAGGCCGAG +GCTGGCGCTGGGCAGAGCCCGCCGGGCCTCCCGGGGACAGCGCCACTTGCGGTGTTTCTC +AGACCGCTGCTGCCCATCTCCTCTGAGCGGGCCAGGGCCCCCACCCTTCCATCTGGGCCA +TGCCAGCTGTGTATGGAGAGCCGCTCACATACGACATTGGGTGCCAAAAGCCCCTGCCAT +CGAGAGCTCATGCAGCAGTCCCTCCTGCCTGAGCCCACACACTGACTCTGAGGCTCTTCT +GTTCTCAGCGTGGTCCCTGCCTCTGCCGTGCCCTATCCGCGTGTGCCAGAAAGGGAAACT +GATCTCATGATTCACCTGCCTGCTAACCTGGGAGGAGACTGCTTCTCTGATAGCATCTCA +CAGTTCTTTTAACATGTTCTTAAAATGTGTCCTGCCGCACCACCCTCAGCCACACCTCCC +AGCACCCATCCTGGAGAATCAGGGCCATGGCAAGGCTGCCGTTGGCAAAAGCCCAGCTCT +GCCATGAATCTCCGTTCAGTTACTGGTTTCACACTCATTTGTGAGGTCACAGACTTGCCA +AGGATATTCATGATTCAATCCATTACAACAATTCTGTGTGTACATAACACATTTTTTCCT +TTCTTTTTTTTTTTTCCTGAGACAGTCTTGCTCTGTTGCCCAGGCTAGAGCACAGTGGTG +CAGTCTCAGCTCACTGCATCCTCCACCTCACAGGTTCAGGCAATTCTCCTGCCTCAGCCT +CCCGAGTAGCTGGGATTGCAGGCACCCACCAACACACCTGACTAATTTTTGTATTTTTAG +TAGAGACGGGGTTTCAGCATGTTGGCCAGGCTGGTCTCAAAATCCTGGCCTCAGGTATAT +ACACATATTTTTACACACACACACACACACACACACACACACACACACACATAAAGGATT +TAAGCCAGGTGCTGTGGTGTACAACTGTAGTCCCAGCTACTAGGGAGGCTGAGGTGGGAG +GATCACTTGAGCCACTGCAGTGATTACACCACTGCACTCCAGACTGGGTGACAGTGAGAC +CCTGTCTCTTAAAAGAAAAAAGAAGAGGCCTTAGCTGCCTGCATTAATTAATGAACAGGC +AGTGTATTTCTGTTCTTTTTTTTTTGAAGACGGAGTCTCACTCTGTTGCCCAGGCTGGAG +TGCAGTGGCGCAATCTTGGCTCACTGTAACCTCCGCCTCCTGAGTTCGAGATTCTCCTGT +CTCAGCCACCCCAGTAACTGTGATTATGGCCACCTGCCACCACGCCCGGCTAATTTTTGT +ATTTTTAGTAGAGACGGGGTTTCCCCATGTCGGCCAAGCTGGTCTCGAACTCCCAACCTC +AAGTGATCCACCTGCCTCGGCCTCCCAAAGTGCTGGGATGACAGGTGTGAGCCACCAAAC +CCAGCCTCAGGCAGTGCATTTCTAAAAGGCAGATAGTGTGATTGTTCAGAGGGTGAAGGG +GAAGTTAAACTTGTCCAGTAAAATCTTCGTTAGCCCGGTATTCTGGATTGAAAAAGCAAA +ATATAGTTCAAGTAGGTCTCTTCAGTGTATCTAATAAGCTCTTGTTTCTGAAACAACTGA +TTCCTTGGCCGGGCGTGGTGGCTCACGCCTGTAATTCCAGCACTTTGGGAGGCCAAGGAG +GGCAGATCACTTGAGGTCGGGAGCTCAAGACCAGCCTGGTCAACATGGTGAAACCTCGTC +TCTAGTGAAAATACAAAAATTAGCCGACTGTGGTAGTGCACACCTGTAATCCCAGCTACT +CGGGAGGCTGAGGTAGGAGAGAATTGCTTGAACCTGGGAGGCGGAGGCTGCAGTGAGCCA +AGATCACACCACTGCACTACAGCCTGCGTGACAGAGTGAAACTCTGTCTCAAAAAAACAA +AAACCTCCTGATTTTTTTTTTTTTTTTTTTTTTTTTTGAGATGGAGTCTGGCTCTGTCGC +CCAGGCTGGAGCGCAATGGTGCGATCTCGGCTCACTGCAACCTCTGCCTTCTGGATTCAA +ACGATTCTCCTGCCTCAGCCTCCAGAGTATCTGGAACTACAGGCGCCTGCCACCACGCCC +AGCTAATTTTTTGTATTTTTAGTAGAGATGGGGTTTCACCATGTTAGCCTGGATGGTCTC +GATCTCCTGACCTCGTGATTTGCCCACCTCGGCCTCCGAAAGTGTTGGGATTACAGGCAT +GAGCCGCCACACCCGGCCGCCTCCTGATTTCATAATAATTCAAGGGACAAACATAATTAC +TTCCCAGGTAAGGCAGTAGAGTGACTAAGAACAAATCCACTTCTGGACAGCCATTATATA +GGGGACATTTTTATCAGAAAAACAGTAAAAGCAAGGAAATGTCTCCCTCCCAGGACTGTA +TGAATTAAACCCTGCCTGCTGATTGCCAAGTGACAACTCCCATTCCAAGCCCCTGGTCCT +CAGTGGGGAGGAAACCAAAGCTTTGTCCCTGGAGGGAGGTCCTGCGGGAATGGCCAGGGA +CGCATCCGCTCTCAAATGCTAGAGCTGGCAGTTGTCATCTGCTCGTGAGAAGGTTTCGCC +TTTGCCTGTCCCCACCCCCGTCCCTCCCAGGCCATCAGCGCACATCAGAGTTAGCACATT +ACATGATGCCTTAATCTTCTAATTGGTTTAAGTCAGCTGACATGTAAAGTGAGGTCTGGG +AGACTGTTCTGGAACTGTATAGATGAGGACGTTGTTGCCCCAGTCTTATTCAGAAGCTTG +AGGATGCAACTTGGACCTGGGTCTGTGGTCCCCTAGGACCTGAAACTCATATAGAGCCAG +CTGCCAGTTCCATTTTGAAGTAGGTTGGTCTCTCTCTCTCTTTTTATTTTTTGAGACAGA +GTTTCGCTCTTGTTGCCCAGGCTGGAGTGCAATGGCACGATCTCAGCTCACCGCAACCTC +CACCTCCCAGTTCAAGCGATTCTCCTGCTTCAGCCTCCCGAGTAGCTGGGATTACAGGCA +TGTGCCACCACACCTGGCTAGTTTTGTATTTTTAGTAGAGATGGGGTTTCTCCATGTTGG +TCAGGCTGGTCTGGAACTCCTGACCTCAAGCAATCCGCCCGCCCCAGCCTCCCAAAGTGC +TGGGATAACAGGCATGAGCCCCTGTGCCTGGCTGTAGTTTGGTTTTTCTGAGCCTCCTCC +TGGTTCCCATTTCTGTTTTTTTGTTTTTGTTTTTGTTTTTTCTCCAAAGACCAAAAGTTC +CACCAGAGAGGAAGATCGAGGGACCAGGCCTTTCTAGTTTCCACATTACACTCTAAGTGC +TGGTCTTAGTAAATTCAAGGCACCTGGTGGGCTTGACCATTCGGGGGCAGATAATTGTTA +CACACCAAAGGGGCATCTTTTGGAAAGTCACTGCCCAGTAACCACTTCCATCTTCTGGAA +GGTCGCTGCTCATCTTCCTAAATGGAAGCCCCAGTTTCTGGACTTGGATGTGTTTTGAGG +ATCTGATGTTCTCCCAAAGTGCCTCAGTTTCCCTATGATGGGGAAAGAGGAAGGGGACGG +ATTTTAGGAATGGAGGTGACCTGGAGGCCGCTGTCCCTGTCCTTAGACCTGCGAGTCCAG +GGGGATGACCGCAAACAGGGCTGTGGGGCCTTTCTTTACTCTCAAAAGCATCACTTCCCC +TGCCTGGAGTTCAGATCCTGCCTGGATCCACGGTGGGAAGGGAGCTCTGGCTCTCTGTAC +TTCACCCACGGCTGCCCACTCACCTGGCTCACAGGGCAGACTGGATGCAGCTTTCAGCCA +GTTGTAGAAATCACAGGTCCCTGGCTGGGAACAGTGACTCAGGCCTGTAATCCCAGCACT +TTGGGAGGCCGAGGCGGGCGGATCATGAGGTCAGGAGATCGAGACCATCCTGGCTAGCAC +GGTGAAACCCCGTCTCTACTAAAAATACAAAAAATTAGCCGGGCATGGTGCTGGGCGCCT +ATAGTCCCAGCTACTCGGGAGGCTGAGGCAGAATGGCGTGAACCTGGGAGGCCAAGCTGG +CAGTGAGCCGAGATCGCACCACTGCACTCTAGCCTGGGTGACAGAGCGAGACTCCGTCTC +AAAAAAAAGAAATCACAGGTCCCTAGGGGCCTAGTGGCCCATCGGTGACAAAGGGCAGGT +GGACCTGGTGTGGCTGCACCAGAGGGGCCTTCTCATCCTGGGAACTGGGCTAAAAACCAA +GCCCAGACTGAGGCCCATGCTTTTGTCCCCCCAGCCGCCTCGAGGTCCCTCCTTACCTGC +CCCCTGCACCCCTACCCCATCTTAACTCTTTTTTTTTTTTTCCAAGATGGAGTCTCGCTC +TGTGGCCCAGGCTGGAGTGCAGTGGTGCAATCTCTGTCCCCTGCAACCTCTGCCTACCAG +GTTCAAGCTATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGTGTCCACCACC +ACACCCAGCTAATTTTTGTATTTTTAGTAGAGACGGGTTTCCCCATGTTGGCCAGGTTGG +TCTCGAACTCCTGACCTCAAGTGATCCGCCTGCCTTGGCCTCCCAGAGTTCTGGGATTAC +AGGCGTGCGTGAGCCACTGCGCCTGGCACCGCACCTTAATTTTGAGGAAGTGTTGGGAAA +GCTGGCTCTGACATCTCTTGTGAGGCAAGCCCAGCTGGGGAAGGTGTTTCCTGCCTGACT +TCCTCCCCAGAAGCAATAGCAGGGCTTGCTGTGGCATCCGCTTCCTGCGGGGGCTCAAGG +TTGCTCGTTCCTCAGGCTACATAAAGCAGTAAGGACCCACCCAGGAGGACCCCTCCAGAG +GTGTGAGGGCGATTTGGTGGACACAGGTAGGGCCAGCGACAGAGCAGAGGGCACACCTCC +CAGAGCCCCAAATGCCACAGGCTGAGAAGGTCTAGCTCTAGCTGCATCCAAAGGACCTGT +TGAACTCCTGTCCCGATTGACACTAAAACTGTCCCCTCCTGTATGGTGCCCACACCCTTC +AGGGGAAACCCCTGGATAAACAGCAGTCACTGCAGGTCTCCAAAAAGACAAGGCCGGAAC +AGGGAACCTGGGGTGCATGTTCAGGAAGCTGTGGCAAGTGTTGACACCACAGCCCCAAGT +TTCTTTTTCTGGCCCGCGGAAGATGAGCTTCAGTCCCATGGAGGTGACAAGGTTGTCCTC +CTGCATGATGGGGCTCTGCGGTGCCTCTGCGCCTGGGTAACCCCTCACCGAGAAAGCCAC +GTCTACAGGTCCCACCTGTCTGCAGGTGTGCCGCCCCCAACTCCAGGCCTGTGTGACTTA +GCGACTGTCCCAGATCTCTCCTGGGAAGTGGCGCAGGGGCCTGGCCCTCAGTGAGTCCCA +GAGGGACCGCACCACCACTGACTTCACTGTGCTGCTTGGAGCTGGGGAGATGTGGAAACG +GCCACTCCAGACCCAGTGACTGGCTGGTGCTTAGGATGTGATTTCCTCATTACTGAAATT +TGTTTCAAGTGTACAGAAATCACCATCGGCCACGTGCAGTGGCTCACGCCTATAATCCCA +GCACTTTGGGAGGCCGAGGCGGGCGGATCACCTGAGGTCAGGAGTTCGAGACCAGCCTGG +CCAATATGGAGAAATCCTGTCTGTACTAAAAATACAAAAATTAGCCGGGTGTGGTAGCGG +AAACCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATTGCTTGAACCCAGGAGG +TTGGAGGTTGCAGTGAGCCGAGACTGCGCCATTGCACTGCAGCCTGGGCAACGGAGTGAG +ACTTTGCCTCAAAAAAAAAAAAAAAAATTTCACCAAAGCCCCTGGGGGTGGTGGTGCACT +GCGGAGTTTATAGCCTTCCTGGGTGGCAGAGGGCAACTGGGCCCCTGAGCACAGAAGTGG +GGCTCCCGCGGGGGTGGGGCTGGCTTGGAAGGTCCCCATTCCTGTGGTGCATATTTGATG +AGGGCCCATGTCGTGCCTGGAGCTGGGCCAGAAGCCACAGTGCAGTGCAGTGGGGACAGA +CCCAGCCTGTCCATGGGCTTGGTTACTGTCAGCCTGGCCGTGTCAGGGAAGGCTTCCAGG +CCACCCACACAGCTGCACCACACCCAGACAAGCTCTCCAAGGGACATCATGAGACTGCTC +CACTGTCAGAGCCCCGGGCCGGTGGTCCCAGCAACTTGGGGTGCCTGCTGTCCTTCATGT +GACATTTTCTTCATTCAAAGCTCAATTTAAACAGCAAGAAGCCTCCCTGCCTCCTACCTG +GCAATTTCCCTGCCCCGCACCTTGGAGGCAGCCCCTGCGCAGTTTGCATCTGGTGATGGC +CAACGTTTGCCACCCTAGTACTTGACCCTATTTAATCCTCACGGCAGCCCATGAAGTAGG +TACAGTGGTCAGTGCCATTTCACAGATGAAAAGACAGAGGCTCAGGGAGCTTCAGCCACG +TGCACAGCTCAGCCGTCAGCCTGCACGTCTCCCCACGGGGCCTGGGTCTCCGTCTGACTC +CCCTAAGTCGAATGCCTGGGGCCTGGAGCCCATTCTCTTGTGTCCCTAGGCCAAGGGCTG +GAGATCAGGTCTAGGGGAGAAGGGAATTCCCAGGGGTGTGGTTCAGGTGTGTCCTGGGAC +AGTCTCCCAAGGGCAGGTCCCTGATTCCCCTCTGCCGAGGCCTCAGGGTCCACCCCTGCC +AAGCAGAGCCCAGCGCAGGTGATTTGGCTGATAAAGGAAGATGGGTCTCTGGGGAGGCAG +CAAGTGGCCCACTTTCTTCTTTGCTTTTTTTTTTTGAGATGGAGTCTCACTCACTCTGTC +TCCCAGGCTGGAATGCAGTGGCACGATCTCGGGTCACTGCAACCTCCGCCTCCCGGGTTC +AAGAGAGTCTCCTGCCTCGGCCTCCTGAGTAGCTGGGATTACAAGCACCTGCCACCATGC +CCAGCTAATTTTTGTATTTTTTGTAGAGATGGGGTTCACCATGTTGGCCAAGGCTGGAGT +GGCCAGCGTTTCTGCCTATTGACACCTGCCTGCCAATACAGGGTCGGTCACACAGAGCCA +GCGTCATAGGTACCTTGGGGCCCATCCTGCTGCCCTAGGCAGGAGGGAGAGCTGGTCCTG +TGGGCTGGCCCAGGAGACGGTCACCCAGGGCTGTCCAAGGGGATGGATCCTGGCTGTCAC +TCGCTCAAGAAGAGGCAGCAGGAGAGGCTTAGGTTAGATCTGGGAAAGAACTGTCCCACC +CAAAGGCTGATTTGCTCCAGTCCTGGGAACTGCTAGATTCCCTCTCCTGATAAAATGTCC +CAGAGGGCACTGCGTGGGTCCCATGCCCTGACGCCAAGTCGCCTTTCTCCTGATATGGTA +CCCACTGGCCTGGCCTTGGGGATTTCCTGGTTAAAGAAATAGCGAGCTCAGCCCATCTGG +GGAAAGCCAAGTGGCCTGAGGGCGGAGACGGTGACATTTGGAAAAAGGCCAGGACTGGCA +GCTCAGACCTGGAAGCCCCCACTCCCTGCCAGCCTGGCTTGAGGTGAGAGCCTTCCTCAT +GAGCCCCCTACCCCCACTCATTCATTCATTCATTCATTCACATTGTTCAAGGGCAAGGCA +TGAGAGTACAACAGTTAAATCATGGGCCTGGGTCCAGACTGCCCAAGTTCAATCGCGGTT +CTAGCCTGGCGCGATGGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCTGAGGCAGGCA +GATCACTTGAGGTCAGGAGTTCGAGACCAGCCTGGGCAACATGGTGAAACCCCATCTCTA +CAAAAAATACAAAAATTAGCCGGGCGTGGTGGCACGAGCCTGTAATCCCAGCTACTCGGG +AGGCTGGCACAGAATTTCTTGAACCAGGGAGGCGGAGGTTACAGTGAGGCAGGATTGCGC +CACTGCACTCCAGCCTGAGTGACACAGCAAGACTCTGTCTCAAAACAAAAACAAAACAAA +TCCCAGTTCTGCATATACCAGCTGTGGCAATCTGTTTTCCTCTCTGTTTTCCCATCTGTG +AAGTGGGGAAAATTGTACCCACTCCCTGACAGCCTCCTTGTGAGGAGAAGATACGGTCAT +AAATAGAAAGCACCTAGAATAGTGCCTGACGTAGGGCAGGGCGGCGGGGTGCAGGGGGCC +CTTCCTATTAGCACTCGGGACGTGGGGGAATTCTTGGGGCCCTGGTATTGTTCTAACACC +CAGTGATGGTTCACCAGCTGTCTCCTTTATAATAATTAGGTAAGAGATGTGGTTTTCTAC +ATATTTCACAATACAAACATTTTTAGAAATTCTATTTCCTTCCCCTGAAAAAACTCTCTT +ATCTCTTTATTACTTCCTTCCTTAACTTTATTTTATTTTATTTTATTTATTTATTTTTTG +AAACCAAGTCTACTCTGTTACCCAGCCTGGAGTGCAGTGGTGTGATCTCGGCTCACTGCA +ACCTCTGCCTCCCAGGTTCAAGCGATTCTTCTGCCTCAGCCTCCCAAGTAGCTGGGATTA +TAGGCTTGCAATGCCATGCCTGGCTAATTTTTTTATTTTTAGTAGAGACCCGGTTTCACC +GTGTTGGCCAAGCTGGTCCCGAACTCCTGACCTCAGATGACCCACCCACCTTGGCCTCCC +AAAGTGCTGGAATTACAGGCATGAGCCACTGCACCTATCTTTTTTTTTTTAATTAAAAAA +ATTATTTGGTACCTTGTTTCATCCATGCATTAAATTAAATCCTGGCCAGACACAGTGGCT +TATGCCTGTAATCCCAGCATTTTGGGAGGCTGAGGTGGGAGGACCACTTGATACTGGAGC +TTGAGACCAGGCCGAGCAGCATCTCGAGACCCCGTCTCTACAAAAAAAAAATAATAATAA +TAATAATAATAAATAAAAAGTGGAAAAAATCCTATGTCATCCTGAAAAAAGGCTGTAAGC +CTGCTTACAGAGGTCATTACAAGGTCAAACTCAAGTTCGGAGCGCTTCCTGCCTCTGCTC +ATCCAACAAACTTGCTGGATACCTCCTGTCTGCAGAGCACTTTGAGGGAACATAACAGGG +TCTTGGGAGGCCACAGGAGGAGAGTTGAAAGATCACAGCCAGGGGCTCAGGGTGTCCACA +GGACAAGTACCCTTGGCCAGGCAGTTACGCAAGTGTGGAAAGACTGCTAGAGGAAGGGAA +GGAAGTGCCGAGAGCCCACAAAATTCTCTGCTTACAACCAGCCCCACTAGAACCTTCCTC +TGCCCTGCCTCGACATGCCCAGGAGAGCACCGCTGCAGGTCTGGCCTCTGTGCTGAGCCT +TTTTTTTTTTTTTTTCCTGAGACAGAATCTCACTCTGCTTCCCAGGCTGGAGTGCAGTGG +CAGGATCTCGGCTCACTGCAACCTCCACCTCCCTGGTTCAAGTGATTCTCCTGTCTTACC +CTCCGGAGTAGCTGGGATTACAGGTGTGTGCCACCATGCCCAGCTAATTTTTGTATTTTT +AGTGGAGACTGGGTTTCACCATGTTGGGCCAGCTGGTCTTGAACTCCTGACCTCAGGTGA +TCCGCCCACCGTAGCCTCCCAAAGTTCTGGGATTAGAGCTATGAGCCACCATGCCTGGCT +ACCGTGCTGGGCCTTTCGAGGAGGCATTTGACAGGGAAGATGAGAGACAAATTGAGTGTC +AGGGAAGGGGTGTTGATAGAAAAATTACAGGAGAGCACACAACTTTCAGCGGGTGAGCCC +AGTGCCTGAGCTGCGGGACCACCCTACCAATGACCTTGAACTTATCTGACTGCAGCCTTG +AACTCCTGAGCTCAAGGAGTCCTTCTGCCTCAGCCTCCTCCCAAGTAGCTGGGACTACTG +GCACATGCCACCATGCCCAGCTAATTATTTTATTTATTTTATTTTATTTTATTTTATTTT +ATTTTATTTTGAGATGGAGTTTTGTCCTTGTTGCCCAGGCTGGAGTGCAATGGTGCAATC +TCAGCTCGCCGCAACTTCTGCCTCCCAGGTGCAAGCGAATTCTCCTGCCTCAGCCTCCTG +AGTAGCTGGGATTACAGGCATGTGCCACCACGCCTGGCTAATTTTGTATTTTTAGTAGAG +ACGGGGTTTCACCATGTTGGCCACGCTGGTCTCGAACCCCTGACCTCAGGTGATCCACCT +GCCTCGGCCTCCCAAAGTACTGAGATTACAGGCATGAGCCACCGCACCTGGCCCCACTTG +TGGAACTAGCATCTATCTGGAGAGGAGGCAAACATCGCCCACCACCTCCCGCTCTCTCCT +GTCACCACTGTCCCCACCATCATTCCAGAGGTCACCCTGGCTTCCAACACCACAGCCTGG +CTTGGGCAGTTTTCAAGCCTCGTATAAATGACATCCTCCAGAACATGTGCTCTGTGCCTG +CCTTCCTTCCGTCAGTGATGTATCTGGAAGATTCCACTGTGTCGCCCTGTGGGACAGGTC +CTTGTCATTGCTGAGTAGATCCTGTTGCAAATGCCTATCTCTCTTCATGGAAAGATCCAA +GATACACAGATGGAAATCATCATAGGAAGGGCTGGCAAGGCCGTTCACACCCAGGGCTGG +GGACCTCAGGGTGGAGGTGGGGGACAGTAAGGACCAGAAGGAGCAGGTGCCGGCGGGTGA +TGTGAGCTTTCTTCTCTATAGAGAAGTGAAGGCCGGGTGCAGTGGCTCACTCCTGTAATC +CCAGCGCTTTGGGAGGTCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCGAGACCAGCC +TGGGCAATTTGGTGAAACCCCATCACTATAAAAATACAAAAAATTAGCCGGACATGGTGG +TGCACGCCTGTAATCCCAGCTATTTGGGAGGCTGAGGCAGGAGAATTGCTTGTACCCGGA +AGGTGAAGGTTGCAGTGAGCCGAGATCATGCCACTGCATACCAGCCTGGGGGACAGAAAG +AGACTCTGTCTCAAAAAAAAAAAAAAGAAAAAAAGAAGTGAAGCACTTGCCAAGCAAATC +TTTCAGAGCAGGTGGAGTGGACCCTACACCTCTTGGATAATAAATGCACTGGATAATAAA +AGCAGGAACAGGCCAGGTGCGGTGGCATGTGCCTGTAGTCCCAACCTACTGGGGAGGCCA +AGGCAGGAGGACTGCTTGAGCCCAGGAGTTGGAGGCTGCAGTGAGTTATGACCAGGCAAC +TGCACTCCAGCCTGGGTGACAGATAGAGACCCTGTCTTTAAAAAAAAAAAAAAAAAAAAA +AGGGCCAAGCACAGTGGCTCATGCCTGTAATCCCAACACTTTGGGAGGCTGAGGTGGGTG +GATCTCCTGAGCTCAGGAGTTCAAGACCAGCCTGGCCAACAGGGTGATACCCCTTCTCTA +CTAAAAATACAAAATTAGCCAGGCGTGGTGGCGCACACCTGTAATCCCAGCTACTTGGGA +AGCTGAGGCAGGAGAATCGCTTGAACCTGGAAGGCAGAGGTTGCAGTGAGCCGAGATTGT +GCCACTGCACTCCAGCTTGGGCAACAAGAGCGAAACTTCGCTTCAAACAAATAAATTAAC +GCCCAGCATGTCTTGGCTTTCATCTGCCAGACCTCAACCCTCACCCCCAGGAGATCAGGT +CCGGACCATGAGCTGACCCTGGACTCAGGCAAGGGTGAGTTGGTGCAGCCCTGGCCTGCT +GGGAGGCACAGGCTGCAGCAGGCTGCCTGGGGCTGAGGCCCGCCACTCATGAACTCATGA +CCTTGAATGAGCTCCAAAAGCTCTGGGCCTCCCAGGCTCTAGGGGGAGTGGGAGAGAGAG +GCCTCAGCCTGTCCCTGGGCATGCTGCCCCCTCCTCACCTCTTTGTCCCAAATCCCCTTC +CTGGCAAAGCTGACAGTCTTAATATCACTCTGGAGAAAACTGAGTCAGCCCTAAGGAACA +ATTCAATGAACCATTTGCTTACTTGAGGATTGGAACTCAAGTCTCACTCAAAGTCTGTGC +CATTTTCGTCCCAGCTGTCACTGGCCCTCATCCACACACACCCAAGGATGAGCATCTAAC +GCTTGCATGCACACTCCCATGCCCGCGTTCATTCACTCATTCATTCATTCATTCACTCAT +TCATTGACTCATTCATTCATTCACTCACTCATTCATTCACTCAGTGAATGTTGCAGTCAC +GATCCAAATATTTATGGCCTCTGTGTGCCAGGCACTAGATGGAGGGGCTGGGGCTAGAGC +CCCTGATAACCCGGTCATGCCCTAGCTTTCCTGGGACACACATTGTGGTAAGGGGAGACT +AAAAAAATTAAGTCAGGCCAGGCACGGTGGCTCATGCCTGAATCCCAGCACTTTGGGAGG +CCGAGGCGAGTGAATTACCTGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGAGAA +ACCCAGTCTCTAATTAAAAAAAAAAAAAATTAACCAGGTGTGGTGGCACATGCCTGTAAT +CCCAGCTACTCAGGAGACTAACGCAAGAGAATTGCTTGAACCCAGGAGGCAGAGGTTGCG +GTGAGCCGAGATCGCGCCATTGCACTCCAGCCTGGGAAACAAGAGCGAGACTCCATCTCA +AAAAAAAAAAAGTGGGAGGCAGAGGCAGGAGGATCACTAGAGGCCAGTAGTTTGAGACCA +TCCTGGGCAACATAGCAGGACCCTGTCTGTACAAAAAAATTAAAAAAAATTTAACCGGGC +ATGGTGGCACACACCCGTAGTCCCAGCTACTCCAGAGGCTGAGGCAGGAGGATCGCTGGA +GCCCAGGAGTTGGAGGCTGCAGTGAACTGTGATCCCACCACTGCACTTAAGCCTGGATAA +CAAAGCAAGACCCTGTCTCAAATAACAATAGCAATAATAATAAAGAAAAATTAAATGCAA +TTTGCGATGCATCAGTGATAAGTGCTCTGCAGAAAAAGGAGGCAGGAAGAGGCTGAGAAA +GGTATGAGGTTTGCTATGCAATGTGAAGTTATCAAGGAAGGCTTCTCGGAAGAGGTGACA +TTTGAGCAGAGAAATGGAGGAGAGTTATGGAGGGAAGATGGTGAATGGGGGGAACATGGT +CAAGACCAGGAATATGGTCAAGGGGGGAAAGATGGTCAAGGGGACGCAGCAAATGCAAAG +GCCCTGAGGCAGGAGCAGCTTGATTCACCCCCAAAACCCGTGGGGCCCGTGCAGGCGACG +GGAAGGACAAGTGTAAACCCTTTTCCTTGTCCCTGCAGGTGTGTGTGAACATGAGTCTGC +CCATGTTTACACCCTGCAAGCCTGAAGAGTCCCCAGAAACTGAAAGAAGAAGCAAAGCCC +TTTCTGTACCCTCCCTGCCCCCTGTCCCGACCGCGACAAAAGCGACTTCCTCTTTCCAGT +GCATTTAAGGCGCAGCCTGGAAGTGCCAGGGAGCACTGGAGGCCACCCAGTCATGGGGGA +CACCTTCATCCGTCACATCGCCCTGCTGGGCTTTGAGAAGCGCTTCGTACCCAGCCAGCA +CTATGTGAGTAGCTGGTGGAGGGCATCCCGTGGGGGGAATACGGGAGGGACAGCACGGCC +ACCCTTGCAGTCCCAGGGCCAACCAGCTCCAGTGAGGACTAACGGGGCAGGGTCTTGGGC +ACCTGGTCCCTGGTCTTTGAGCCTGGATCTACCCCTCTGATCCCTGGGAAGACAGTTCCC +TTGGACCCGCCCTGGGCCCCAGCCCTTTACTGTCCCCGCCTGTGTCCCCAGCCAGGCCCT +CAGCCTTAGCCAGGAGTCCTCTTTCTGCTCCCCTGCCATGGCCAGGCAGCCCAGCGCTCT +CTCAGGTCCGAGGCCCACTCCTCCAGGAAGCCTTCCCTGACTAGCCCAGCTATCAGAGAG +TGGCCCTCCCAAGAGGGAGGCCTGGAAACTAAAGCTCTCTCTCTCCCCAGCTGCCTGTAG +TGTCAGTTAGAGTCTTATCCTCTCCAGTAGGGTGACACCATGACAGGGGCCAATAGAGTC +CTCCCATCTGTCCCCAAGGAGGCTGGACAAATGCCTGCTCAGACACACAAGTCCACTGGG +TCCCCTAATCCCATAGGAAGGCCAGGGAGGAACTACATTTAGGAAATTGAAGCTTGTATG +GAACATTTAGTCCTATGTGCCAAGACCTTTCTCTTTTTTGTTATTTTTTTGTTTTTTGAG +ACAGAGTCTTGATCTGTTGCCCAGGCCAGAGTGCAGTGGCACGATCTCAGCTCACTGCAA +CCTCCGCCTTCCAGGTTCAACTGGTTCTCCTGCCTCAGCCTCCAGAGTAGTTGGGATTAC +AGGTGCCCACCACCACGCCTGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCACCA +TGTTGGCCAGACTGGTCTCAAACTCCTGACCTCAAGTGATCCACCCACCTGGGCCTCCCA +AAGTGCTGGGATTACAGGCATGAGCCACCGTGCCTGGCCTGTTTTTTTGAAATGAGGTCT +GGAGTGCAGTGGTGCGATCATAGTTCACTGCAGCCTCGACCTCCCAGGCCCAAGTGATCC +TCCTGCCTCAGCCCCTTGAGTAGCTGGGGCTACAGGCGCACACCACCATGCCTGGCTAGT +TTTTAAAATTTTTGTGGAGATGAGGTTTCACTATGTTGTCCAGGCTAATCTTGAACTCCT +CGGCTTAAGCAACCCTCTGGTCTCAGCCTCCCACAGTGCTAGGATTACAAGCGTGAGCTA +CCGTGCCTAGTCACTTTTCTCCTTTTCTTTGTAACTTTCAGTTTTGAAATTTCAAATTTA +CAGAAAGGCTACTGGGTGTCAAAACGGTACCAGTCACTCCAATAGTCTTTCACTCACCTT +CATCCACACCTCTCTTTCTGGGGATATTTTCTGAATTATTTGAGAGTGAGTTGAAGACGT +GTTTCTTTACCTCTAAATACTAGTTGTTGGGCATTTCTTAAAATCAAGGCATTCTCTTAC +ATAATCACAACACACGTGTCAAAATCAGGAAATTAACATGGACAAAACACCATTATCCAC +CCACAGACTTTACTGAGGTTTCCCCGATTATCCTGCTTGTCCTCTGCAGTGAAAACTTTT +TTCAGGTCTAGGATCCAGTCAAGGATCAATGTCATAGCCTTTAACCTTCTTTAATCTGGA +TCAGTCTTTTTTCTTTTTCTTTTTCTTTTTTTGGACACGGAATCTCACTCTGTCGCCAGA +CTGGAGTGCAGTGGTGCAATCTCGGCTCATTGCAACCTCTGCCTCCTGGGTTCAAGAGAT +TCTCCTGCCTCAGCCTCCTGAGTAGCTGGGAATACAGGTGCGCGCCACCATGCCCAGCTC +GCATTTTTTGGTAGAGACAGGGTTTTGCCATATTGATTCTGGATCAGTCTTTTTTTTTTT +TTTATGAGATGGAGTCTTACTCTGTCACCCAGGCTGGAGTGCAATGGCACAATCTCCACT +CACTGCATCCTCCGCCTCCCAGGTTCAAGCAATTCTCGTGCCTCAGCCTCCCGAGTAGCT +GGGATTACAGGCATGCGCCACCATGCCCGGCTACTTTTTGTATTTTTAGTAGAGACAGGG +TTTCACCATGTTAGCCAGGCTGATCTCGAACTCCTGACGTCAGGTGATCTGCCCGCCTCG +ACCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCAGCGGATTCTGGATCGGT +CTTAATCAGTCTTTGTCTTTTGCAACTTTGATGTTTTGCAGAGAGCAGACCAGTTACCTT +GTAGAATGTCCCTTAGTTTGGGTTTATCTTCATTAGATTCAGTTTGTGTATCCAGGGCAG +TGGATCTTAGATGCAATTCTGTCTTCTTTTTAATTTTTTTGAGAGGGAGTCTCGCTCTGT +CACCCAGGCTGGAGTGCAGTGGCACAACCTCAGCTCACTGCAGCCTCCGCCTCCCGGGTT +CAAGCAATTATCCTGTCCCAGCCTCCCAAGTAGCTGGGATCACAGGTGCCCATCACCACT +ACCGGGTAATTTTTGTGTTTTTAGTAGAGACAGGGTTTCACCATATTGGTCAGGCTGGTC +TTGAACGCCTGACCTCAGGTGATCCACCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAG +ACGGGAGCCAACATGCCCAGCCTTCCTGCCCCTCCCGTCCCCTCCCCTCTCCTCCTGTCC +CCTCCCTTCCCCTCCCCTCCCCACCCAAGCTGGAGTGCAGTGGTGCAATCATAGCTCACT +AAAGCCTTGACCTCCAAGTCTCAAGCAATTCTCCTGCCTCACCTGGGGCCACAGGTGTGC +GGCACCACACCCGGACAATTTTTGTGTTTTTAGTAGATATGGGGGTCTCGCTATGTTGCC +CAGGCTGGTCTCAAACTCTTGGACTCAAGCGATCTTCCCACCTCGGTACTAAAAAGTGCT +GGGATTCCAGGTGTGAGCCACCGTGCCCAGCCTAGGTCCTACTTTTATCTCCAATTTACA +GATGAGTCCATTTGAGAGAAGCTGACCCTCTTGCCCTGGGTCTCAAGGCTGGGGCGTGGC +AGCACTTGGGTCCACGTTTGTGCCCTTTCTGCAATCCAGGACAACCGCAAAGATGGTCCT +CACCCCAATCCTCTGGGCTTCCTCCAGTGGGTAGTGGGATCCTGGGTGCACACAGCAAAG +CCTCTTTGGAGGCTGAATGGGGTCCCCCGACTCTGGCTTTCCCCCAGGTGTACATGTTCC +TGGTGAAATGGCAGGACCTGTCGGAGAAGGTGGTCTACCGGCGCTTCACCGAGATCTACG +AGTTCCATGTGAGTGTGGGGATGGAGGAGGGACAGGGACCCACCGTTCCAGCTCCACCCT +TTGGGAAGGACCTTAGCCCAGGTGATGGGGAAACTGCAGAACCCAGAATCCCCTCCCAGA +CCACAGTTAAAGGGGATTTATTTATTTATATAAATTTTTGTGACAGGGTCTTGCTCTGTC +ACCACTCTGAACACCTCATGTTCTCTGATTACAGGCATGAGCCCCCACGCTCGGCCTTTT +AGGTGGTTTTGAGAGGTATTTAGGTTTGCAGTGCAGGGGCGCAATCATAGCTCACTGCAG +CCTCGACCTCTGGGGCTCAAGCGATCCTCCTGCCTCAGCCTCCTGAGTAGCTGGGACTAT +AGGTGCGCATCACCATGTGTGGCTAATTTTTGTATTTTTTATAAAGATGGGGATCTCACT +ATGTTGCCCAGGCTGGTCTTGAACTCCAGACCTCAAGTGATCCTCCTGCCTTGGCCTCCC +AAAGCTAAGGGGGCATTAAAAGAAAAAAACATTTTTCCCCCTGAAACATTTAAGTAGTCT +TACTGAAAACAATAAAACACAGAAACACCAGATTCTCATTTTAAAGTAAAACAGACAGGA +TCTCCCAGAACCTTCCTAGAATGGAACCATTCTTGTCGCTTTTGAAAAACAAAGCCAAGT +TCTAGATCCCAAATAAATGCACCTGCTGGTGAACATTCTCCTTGTGGTTCTCGTCCCTAT +GTTAGTTATTTTCCTAAATTTTACATTTGTACCTTTTTAAGAATGAGTTATCAGTTTTTT +TATATTTGCTTTTCTTTTGAGATGGGGTCTTGCTCTGTCACCCAGGCTGGGGTGCAGTGG +TGCAATCACGGCTCACTGCAGCCTCAACCTCCAGGGCTGAAGCGATTCTCCCATCTCAGC +CTCCCATGTTGAGATCACAGGTGTGCACCACCACACCTGGCTCCTTTTCCTGATTTGTTT +TTTGTAGAGATGGGATTTCGCTATGTTGCCCAGGCTGGTCTCTAACTCCTGGACTCAAGT +GATCCTCCCGCCTCAGCCTCCCAAATTGCTAGGATTACAGGTTTGAGCCCCTGCACCTGG +TCAACCTGAGTTTTAAGAGGATCCCTTTGGCGACTGGATTGAGGACAGACAAGAGTGGAC +GGGGGACACAAGGAGGCCATTTTCGTTATCCAGGCCTGGTAGTGGCTAGGGCCAGGAGGG +TGGGGTTGGTGGGAAGCAGTCAGATCCCAAAGAGATTTGGGGATTGGAAGCAAAAGGATT +TGCTGGTGACTTGCACATGGGAGGGAGAGAGGTCAGTGCCTCTGCTAATCAAGGAATCCA +GATTGCCACCGAAATTTCTAGGCCCGAGATATTTAGGTAGTGTCTCACTCTGTCACCCAG +GATGGAGTGCAGTGGCACCATCTCGGCTCACTGTAACCTCCGCCTCCCAGGTTTAAGCGA +TTCTCCCACCTCAGCCTCCTGAGTAGCTGGGATTACAGGCATGTGCCACCACTCCCGGCT +AATTTTTGTATTTTTAGTAGAGACGGGGTTTCACCACGTTGGCCAGGCTGGTCTTGAACT +CCTGACCTCAAGTGATCCACCCACGACAGCCTCCCAAAGTGCTGGGATTACAGGCGTGAG +CCACCATGCTCGGCCTTTTAGGTGGTTTTGAGAGGTATTTAGGTCACTTCCAATCTCGTG +CTTTTCCAAGTGTTGTAAACTACAAATATTCCTTCACGTCTTCTTGTCTTTTTAATGTTT +AGAAAACCTTAAAAGAAATGTTCCCTATTGAGGCAGGGGCGATCAATCCAGAGAACAGGA +TCATCCCCCACCTCCCAGGTGAGCACGGGGCTGAGCCGCCTGTCAGGGGGTCATTGGCGG +GGGCTCACCTGCCCTCCCAGCCCCTCTCGGGCTTGACCTCATGTTCTCTGGTGCCAGCTC +CCAAGTGGTTTGACGGGCAGCGGGCCGCCGAGAACCGCCAGGGCACACTTACCGAGTACT +GCAGCACGCTCATGAGCCTGCCCACCAAGATCTCCCGCTGTCCCCACCTCCTCGACTTCT +TCAAGGTGCGCCCTGATGACCTCAAGCTCCCCACGGACAACCAGTGAGTGAACTTTTCAC +CCTGCCAGGTGGGAGAGGGAAGGAGGGGTGGGACTTTCTGTGTTTTGCAGATGAGGAAAC +CAAGGCTCAGAGAGGGAAAGCCACCTTCCCAGAGCCACACAGCCAGAAAGAGGAGGCAAA +TTCCACCTCCGGCCCCTGTGACCCCGCCAAGCCTCCACCTTAATCTTTCACACCTCAGGG +CACTGGGGGAAGCACTCGGGGCTGGAGGTTCAAAGTCCTGGGTCCTCATCCTGACATTAT +GGCCACCTGGCCATGGGACCTGGAGCCAGTCACCACTGCTCTCTGAATGCAGGTTCTCCA +TTTCTATAATGGGCAGTGAGGATCAGATGAAGCATTGGGTGTCTTGCGGAGCCCCCCAGA +AGGATGTGGGGTTGATGCCTCTGCTAAGTGCTGAGCATGTCTGGGGTCTCCTGTACCCAG +GACCCTGTGTGGAAGGCACCTGAGAGGCTGAGGGAGCTCCAGGCAGGCTGGGGAAGTCCC +CTTCTCCACTCCTCTCTGGTCACTGAAGCTCGAAGTGGGGAGCATGAGGACAGGACGTTA +CCCCTTGTCAAGGCACCCAGGCTGCCAAGACAGAGACAAGCAGCATTGCTCCGGCCAGCA +CTTATTGACGCTTGAAGGTGTCCCCTGGCCCAAGGAAGGGCAGTTATCATCAGCCCGGGA +GGCGGGGGAAGGATGGACTCTGCAGTGGGGTCCGCTCCTCATTGCCTGCTCTCTCAGGGC +TCCAGAAGGAGGAAGAGGCCGGGCACAGTGGCTCACACGTATAATCCCAGCACTTTGGAA +GGTCGAGGTGGGCAGATCACCTGAGGTTGGGAGTTTGAGACCAGCCTGGCCAACATGGTG +AAACCCCATCTCTACCAAAAATATAAAAATTTAGTCAGGCATGGTGGTGTGCGCTTGTAA +TCCCAGCTACTTGGGAGGCCGAGGCAGGAGAATCGCTTGAACCCGGGAGGCAGAGGTTGC +AGTGAGCTGAGACTGCGCCACTGCACTCCAGCCTGGGTGACAGAGCGAGACTCTGTCTAA +GAAAAAAAAAAGAAAAGAAGAAAGAAGATGGCCTGGGAGCCCGCAAGAGCATTTTCCAGG +CTTAGGGCATCCTTTGGGTCTGCAGAAGGCTATGCAGTGTCCTCCTCATGTCCCTCCCTT +GGGCTGCCCGAGCAGATCCGCCCGCCCCCATCACTTCCTGAAGCCCTTCCTCAGCCAGTC +CAGTTGCTGTCTTCTCTCCGCAGTGCCCCTTCCCTTTCCCGGGTCCCTCTTCTCTTGGGA +AGTTCTTCTGCAGGTCTACCCAGTGCCTCTTCTTCCTCCATGGGAAGCCAAGGGTCTCAC +CCAGACTGTTCTCTCCTCAGGACAAAAAAGCCAGAGACATACTTGATGCCCAAAGATGGC +AAGAGTACCGCGACAGGTGAGAGGACGGGGGGCAGCCGGCGGGGGGGGACACCCTGAGGA +GACCCAGAGTGTTCAGGGAATGGAGCAGGGGCTGGGAGCAGGCTGGGAGGGCTCACAGCT +ACCCTGCTGAAGAATTGGGTCTTTGGGCCGGGTGCGGTTGCTCATGCCTGTAATCCCAGC +AGTTTGGGAGGCCGAGGCAGGTGGATCACTTGAGGTCAGGAGTTTGAGACCAGCCTGGCC +AACATGGAGAAACCCTGTCTCTACTAAAAATCCAAATTAGCCAGGCGTGGTGACAGGTGC +CTGTAGTCCCAGCCACTTGGGAGGCTGAGGCAGGAGAATTGCTTGAACCCGGAAGACGGA +GTTTGCAGTGAGCCGAGATCGTGCCACTGCACTCCAGCCTGGGCAGCAGAGCCAGACTCC +ATCTCAAAAAAAAAAAAAAAAAAAAAGAAGAATTGGGTCTTTGGAAGGTCCCTGGAGACT +GAAAGGAGCCCTTTGCAGGTGGCAGTGCAGAGACCAGCGCAGACCCTTGCTACTGGCAGC +CGGGGGAGTGTTTGCGGCTGAATGAATGAACAGGTTTTGGAGGGCAGTGTGGCCTTCAGA +GGCGATGCAGGGCTGTGGCAGTTTCTAATACTTATTGCACAGTCACTGCTAATAACAATA +ATAATAATAATACCTAACATTAATGGAGTGCTTACTCTGTGCCAGCCACTATTTTGTTTT +TGTTGTTTTCAGTGACAGGGTCTCGCTCTGTTGCCCAGGCTAGAGTGAAGTGGTGTGATC +ATAGCTCACTACAGCCTCGACCTCCTGGGCTGAAGCGATCCTCCCACCTCAGCCTCCCAA +GTAGCTGGGATTACAGGTGTGTGCCACCATGTCCAGCTAATTTTTAATTTTCTGGTAGAG +ATGGGGTCTCACTACATTGCCCAAGCTGGTCTTAAGCTCTTGGCCTCAAGCAACCCTCCT +GCCTCAGCCTCCCAAAGTGCTGAGATTATAGACATGAGCCACTGTGCCCGGCTTTTTCTT +CTTCTTATAAGGACACGAGGCCTGTTGGGTTAGGGCCCACTCTACTGACCTCATTTTAAT +TTAATTACCTCTTGAAACGTACTTAAGAGTACCTTTCTCTTAATACACCCACACTGTAAG +GTACTGGGTGGTTAGGACTTCAACATATGAATTTTGAGAAGGCGGATGTCAGCCAATACT +AAACAGCATCAGCACCTCCACGGTTGGATGAAGGGCTGGTCAGAAATGCACACTCAGGTC +CCACAGTGGACCTACTGAACAGGATAGGCATTTTAGCAAAATCCCAGGTATTCGGGTGCA +CCTTAAAGTTAGGAAAAGGTCAGGCACTGTGGCTCATGCCTGTAATCCCAGCACTTTGGG +AGGCCGAGGCGGTTGAATCACCTGAGGTCAGGAGTTCGAGACCAGCCTGACCAATATCGT +GAAACTCCATCTCTACTAAAAATACAAAAATTAGCCAGGTGTGGTGGCGGGTGCTTGTAG +TCCCAGCTACTTGGGAGGCTGAGGCAGGTGAATTACTTGAACCTGGGAGGTGGAGGTTGC +AATGAGCCAAGATTGCACCACTGCACTCCAGTGACAGAGCGAGACTCCATCTCAAAAAAA +AAAAAAAAAAAGTTGGGAAAAGGCCAGGTGCAGTGGCTCCACACCTGTAATCCCAACACT +TTAAGAGGCTGAGGTGGGAGAATCCTTTGAGCCCAGGAGTTCGAGACCAGCCTGGGCATT +GTCCCAAGACCTTGTCTTTACAAAAAATTAGCCGGGTGTGGTGGCATACGTCTATGGTCC +CAGCTATTCGGGAGGCTGAGGCAGGGAGATTGCTTGAGCCTAGGAGTCCAGGGCTGTAGT +GAGCTGTGATCACGTCACTGTACTCTAGCCTGGGCAACAGAGCAAGACTCTGTCTCCAAA +AAAGAAAATAAAGTTGGGAAAGGCTCACTAACTTCATCAGATGAGAACAAGGACATGTTT +GAAGTGTGAGGCCGAAGCCTGGAGAACGCTATGCGCCCAGGAAATGCAGGGCAGCAGAGA +CTCAAGATGCCAGCGCCTGTTCTGGAGGCCCAGATGGGCCCTGCAATGCCCACTCACCCT +GCCCTCCCTCTTGCCCCAGACATCACCGGCCCCATCATCCTGCAGACGTACCGCGCCATT +GCCAACTACGAGAAGACCTCGGGCTCCGAGATGGCTCTGTCCACGGGGGACGTGGTGGAG +GTCGTAGAGAAGAGCGAGAGCGGTCAGACCTCCCACCTTACGGGGCTCCTTCCCCTGGTG +CTCAGGAACCCACAGCCACAAGCCCCCTGCCAAGGCTCAGGCAGCCTTGCCCCTGGGAGG +ACTCCGGCTCTGTTAGGGGCCCTAAATGTCCTCCCCACACTGTGGGTCGCCTTCTGTCTT +AGTGTGCACCCTGTGGTGGCTGTGGGCATCTGTGCATGGCAGGCCGGGGCGGGGCATGTC +TGCGTGTTCTGTCTGGATGGGTATGGGACCGTCTGTTCATTATGAAGTGGGCTCAGAGCT +GTGATTCTGTGAGCATGTGTGCATGCATGCATGTGACCTCATTGTCCAGTGTGGTGAAGG +TGACATTTCCAAATCTGAGCATTGGACATCAGTGTGTCTGTGTCCCTGTGTCCTCACCAT +CCCTGATGGCTGCAGGGAGCCGCTGGGCCCTGCCCCTCAGTCACATTCCCGCACCTCTGG +CACAGGTTGGTGGTTCTGTCAGATGAAAGCAAAGCGAGGCTGGATCCCAGCGTCCTTCCT +CGAGCCCCTGGACAGTCCTGACGAGACGGAAGACCCTGAGCCCAACTATGCAGGTGCCCC +CTGCCCTCCGAGGCTGTAGGGGTGTGGGAGAAAGGGGCAGGCAGGGCTCAGGGATATTGA +GTGACTGCTTTGGAGTCTGGGCTGGTTGCTGGCTTGGCAGAAAAGTCAGGGCTAAGATCT +CATCGACTCTGGCTTGGGGGCCCTGGCAGGTTGTGATGCCCTTGGTCTGGACAGGGAACC +AGGAGGAGGAGCAGACGACTGGGGAGAGTGGGAGGCCAGTGGTGTCTGTGGATATGTGGC +CAGGTTCAGTGGGAAGCTGAAGGATGAGCAGACCTTAGGCTCAGGAAGGAGGGCTGCCTG +GAAGTGGGGGCATCATCACTGACCAGAAAGGGAAAACTGGCAGTGCCAGGGCTGGATGGG +GCCTGCATTGAGCTTGAAAAAAACTATAATAGAATTGGTTACCATTTTATTTTATTATTT +ATTTATTTATTTTACTTTTTTGAGATAGAGTCTCACTCCCTTGCTAAGGCTGGAGTGCGG +TGGTGCTATCTCAGCTCACTGCAACCTCTGCCTCCCAGGATCAAGTGATTCTCCAGCCTC +AGCCTCCCCAAGTAGCTGGGATTACAAGCATGCACCACCATGCCTGGATAATTTTTGTAT +TTTTAGTTGAGACGGGGTTTCACCAGGTTGGCCAGACTGGTCTCGAACTTCTGACCTCAG +GTGATCTGCCTGCCTTGGCCTCCCAAAGTGCTGGAATTACAGATGTGAGCCACTGTCCCT +GGCCTGGTTACCCACATTTTAAAATGGAGTGATTTCACCCTTTTATGTGGATTTACAGCT +TTTTTTTTTTTTTTTGAGACAAAGTCTGGCTCTGTCACCCAGGCTGGAGTGCAGTAATGC +AATCTCAGCTCACTGCAACCTTAGCCTCCTGGGTTCAAGCAATTCTCCTGCCTCAGCCAC +CTGAGTAGCTGGGATTACAGGCATGCACCACCACGCCAGGCTAATTTTTTGTATTTTTAG +TAGAGATGGGGTTTCGCCATGTTGGCCAGGCTGGTCTCGAACTCCTGACCTCAGGTGATC +CGCCCGCCTTGGCCTCCCAAAGTGCTAGGATTACAGGTGGGAACCACCTTGCCCAGCCTG +TGGCTATCGTTTAAACACTGGGAAGGCCTGCAGCCCCCAGGCCGACAGTTAGCTGCAGCT +GAGCAGTTCCCAGTGCCAGGTAGACGGATGCTCCACCCACCTACTCATGGCTGATCTCTT +GTCATAGTGAAGTGTCTGGACAGACCTTCATCGTTATGGGATCTCTGGTCCCCAGAGTGG +GTGGCAATGAATGGGAGTGGACAAGCTCACCTGGGTGTAGGGGGCAGAGGGCCGAAGTCC +AGAGTGTACCCCCAGAGTGGGTGCCAGCAGGAGCTTGCCGAGGGATCTGGGATGGAGCAG +GAGGGTGGAGGGAGGAGACCCAGAAGAGGGGGAACTGTGGGCCCTGGGTGGGTCTGGAGT +GCCTGGAGGAAGCCCAGGCGCAGAGAGGAGAAGATGGGATGGGTGGCGAGCCCCAGGCTG +GGCCGACCTCACACTGTGCTCTGTGCCCCTGCCGTGGACCAGGTGAGCCATACGTCGCCA +TCAAGGCCTACACTGCTGTGGAGGGGGACGAGGTGTCCCTGCTCGAGGGTGAAGCTGTTG +AGGTCATTCACAAGCTCCTGGACGGCTGGTGGGTCATCAGGTAGGAGGGCCCCTCTCCAT +CCAGAGCACCCATCTGAGTCAGCCCCAGCCAGGACGGGGTGTTTAGGGATCTGGGGTGAC +TTGTCCCTGGGACTCTGGGTAAGCCACTGCCCCTCTCTGGGCTTAGTTTCCATCTCAGTA +GCAGGGAGGAATGAGCCCACCCTTGCCTGTCTTGTGGGGATCCAATGTCCTTGTCCAAGT +GGGTGCATTTCTCCTTTGTGATTTAGGGTCTCTTCCCAACCATCTATTATTATTCCTTCT +CTGGCAACATGGTGAACTGTTGTATAAATAATTACATTCCTAGCTAGGCGCAATGGCTCA +GGCCTGTAATCCCAGCACTTTGGGAGCCCAGGACAGGACGATCATGTGAGGTCAGGAGTT +CGAGACCACCCTGGCCAACATGGCAAAACCCTATCTCTACTAAAAACACAAACATGAGCC +GGGTGTGGTGGTGGGAGCCTGTAATCCCAGCTACTCGGGAGTCTGAGACAAGAGAATCAC +TTCAACCCGGGAGGCGGAGGTTGCAGTGAGCCAAGATCGCGCCATTGCACTCCAGCCTGG +GCAACGAGAGCGAAACTCCGTCTCAAAAAAAAAAAAAAAAAAAAAGATTACTTTCTTTTT +ATCATTCCTTTATCTTTTAAAGCTTTCTTGCAGTCAGGTGCAGTGTCTCATGCCTGTAAT +CCCAACACTTTGGGAAGCTGAGGTGGGAGGATCACTCAAGGCTACAAGTTCAAGACCAAC +CTGGGCAATGTAGGGAGACCTCTGTCTCTACAAAAAAAATTAAAAAATAGCTGGATGTGG +TAGCACACACCTGTAGCCCCAGCTACTCAGGAGGCTGAGGTGAAAGGATCACTTGACCCC +AGGAGTTGGAGGCTGCAGTGAGCTATGACTGCACCACTGCACCCCAGCCTGGGTGATGGA +GCAAGACCCTGTCTCAAAAAAAAAAAAAAAAAAAAAGCTTCCATTGCAATTCCCATCTGT +TTATCCTCCAAATGAATGCAGAAATACTAATTATCTTTTTTCTGGTTCTGGGGAACACAG +AATTCTAGCGGCTTGTGGAGCCATTTCCCTGGAGCCATGGGGCCTCCCAGGTCCTTTCCT +GTGTCTTCATTTTTTACGAATTTTTTCATTTTTTGAGACAGGATCTTGCTCTGACTCCCA +AGCTGGAGCACAATCATCGCTCACTCAAGCGATCCTCCCACCTCAGGCTCCCACGTAGCT +GGGACTACAGGTGAGCACCACCACATCTGGCTAATGTTTTTTAATTTTTTTGTAGGGATG +GGGTCTCACTATGGTGCCAAGACTAGTCTTAAACTCCTGGCCTCAAGAGTTCCTCCTGCC +TTGGCCTCCCAAAGCACTGGGATTACAGGAATGAGCCTCCATGCTGGGCCTTTGCTGGCG +TCTTCAGAGCCCTAGGTCACAGGGCCAGCCTGGCGCCCTGCCGCAAGCTTATCTTAAAGC +TGGGACCACAACATGCATACCTGCAGCCGGGCCCGGGGCCAGAGGGCTTTGAGGCAGCAT +TTCTCAGCCTTTTAGACACACACTCTGTTAACCCCCATCCTGTGTCTCTGATAATCTTCT +TGTGATCCTCCCACCAGCCAAGAATTGGGTTTTATGTGAACCTTGTATTATGCAAAGTTT +TCTTTTGTTTTTTTTTTCACTCCCAAATATAATATTGAGAATAGAAAGAAAGTCTTTTCA +ACAAATGGTGCTGGAACAGATGGATTTCCATACTGGAAAAAAAAAAAAAAGAGCAAAAAA +CAAACCTAGACCCCTTCCTCACACTGTACACATATGTTTACTTCAGATGGATCACAGGTT +TATCCCAGAGTAAAACCTGAAACTAAAAACCATTTGGGGCTGGACAGGGAGCTCACGCCT +GTAATCTCAGCACTTTGGGAGGCTGAGGCAGGTGGATCACTTGATGTCAGGAGTTTGAGA +CCAGCCATGACCAACATGGTGAAATCCTGTCTCTACTAAAAAAATACAAAATTAACCAAG +TGTGGTGGTGCATGCCTGTAATCCCAGCTACTTGGGAAGCTGAGACAGGAGAATTGCTTG +AACTTGGGAAGCAGAGGTTGCAATGAGTCGACATCATGCCATTGCACTCCAGCCTAGGCA +ACAAGAGCAAAACTCTGTCTTGGGGTTGGGCGGGGGAAAAGCATTTGGAAGAAAGCATAG +AATTTGGTGGCTTGGAGGTAGGCAAAGGTTCGTAGGAGACAGAAGGCAGTTAACATAAAA +GAAAAATTGGCAAATATAATCCGCCAATGTCTTCTTTTTTCTTTACTTTTTTCGGGAGGT +AGAGATAGGGGTCTTGCTATGTTACCCAGGCTGATCTCCAACTCCTGGCCTCAAGCGATC +CTCCCACCTAGATCCCTCAAAGTACTGGGATTACAGGCGTGAGCGACCGTGCCCTGCCCA +TTCTTGCCAATGTCTTATAGCAAATACCTGTCCCCTGCGGTGACCTGGATCTGCTAACCT +CCACCCCTGCCTAGACTGTGGAAGGATTGCTGGAAGGGTCTCAGTTGCACAGACCAGGAA +ACTGAGGCCCACAGAGGCAGGTGTCCGGTTGTTTGCAACCTCTCAGCCTGTGCTAACCCC +AATTGTTCAGAGAGAGCCCTGAAACCCTCTCCTCTGGGCGCCCCCAGGTGACTGCCCCAG +CCTCAAGGGCTGCCTCTGTTGCAGGAAAGACGACGTCACAGGCTACTTCCCGTCCATGTA +CCTGCAAAAGTCAGGGCAAGACGTGTCCCAGGCCCAACGCCAGATCAAGCGGGGGGCGCC +GCCCCGCAGGTAAGCGGGGGTCCCCGGGGCTGGGCGGGGTCGAGCGGGGCGCACCACGGG +TTCGCTCTGTCTAGGCCATAGCTTGGCAGTGCCGGGGCGGGGGCTCTCAGCCTGGCAGGA +GAGGCAGGACCCTCACGGGGGAAAGGGGCTGGACGCGCCTGGCCGCGGTGTGGGGCTGGC +ACGGGGGCGGAAGGAAAGCGGCGATGCCCGGGGGCTTTGGGGATGGGCAGTCCAGGGGGG +GTCCCCGGAGAGGGGGACGACAGACCGAAGGCTGGTGAGGGGCGTGGAAAACCGCCCAGG +CTCTGCTGCAGGGCAAGGGTCCTTGTCGTGACGGGGGCAGCCGCCTCTTGTCCCGCCGGG +GTCGTGCAGACTACCGGCCCCCTACTGCCCCCCACTTCCTCGGACCAGGGGTGCCCATCT +GAGTCCCTGGGGGCAGGGGCGCCCTCGGGCTTTGACGACGCCCCGTCCCGCTGGGCCAGG +TCGTCCATCCGCAACGCGCACAGCATCCACCAGCGGTCGCGGAAGCGCCTCAGCCAGGAC +GCCTATCGCCGCAACAGCGTCCGTTTTCTGCAGCAGCGACGCCGCCAGGCGCGGCCGGGA +CCGCAGAGCCCCGGGAGCCCGCTCGGTGAGTGCAGCGGGAGAGGGCAGGAAGGGCAAGCC +CTAGAGGCGGAGTCAGCGGGAGAGGCGGGGCCAGAGGTAGGGCCAGAGTAGCGGGGCGGG +ACCAGAGGGCGGAATCAGAGGGAGAGGCGGGGACTGGAGGCGGGGTCAGAGGAGGAGCCA +GCGCTAGGGGGCGGAGCGATCCCTAAGAGGCGGAGTCAGAGGGAGAGGCACAAGCGGGAG +GCGAGGCCAGAGCGCGGAGCAGGAGTTGGAGACCGCGGCGGGGCGAGGCCAGAGAGCGCT +GTGGGCGGGGCCAGTGTGCGGGGCGGGGCGTCTGACTCGGCCCCGCTCTCTGCCCGCAGA +GGAGGAGCGGCAGACGCAGCGCTCTAAACCGCAGCCGGCGGTGCCCCCGCGGCCGAGCGC +CGACCTCATCCTGAACCGCTGCAGCGAGAGCACCAAGCGGAAGCTGGCGTCTGCCGTCTG +AGGCTGGAGCGCAGTCCCCAGCTAGCGTCTCGGCCCTTGCCGCCCCGTGCCTGTATATAC +GTGTTCTATAGAGCCTGGCGTCTGGACGCCGAGGGCAGCCCCGACCCCTGTCCAGCGCGG +CTCCCGCCACCCTCAATAAATGTTGCTTGGAGTGGACCGAGGCTCTGCAGGAATGCAGGG +AGGGCCGGGCTCCGCCCCAGGGTTATTTCTAAGTTGAGGACAGGAGGTTGTGAGTTCTGC +TGGGGGGAAGTTGCAAGAGCCGAGGTCTGGTTGCATGTTGCCCTGGTCTTGGCCAAGAAC +AGGTTTGCACAAGGCCAAGTTCAAGAGGAACTCCCGGTTTCCTGCTGACCGTTTGGTCAG +AAACCACCTGCTTGGACTCTGGCGGAAGAGTGCTGAAGATGGGTGCACACAGTGCAGCAG +GGCAGCCCTGTCTCATGACAGGAGACAGGCTGCCGTCCAGGGTGTAGGAGTGACCTCATA +GCTGGGATAAAAAATATATTATAACTTAGGTTCGGGCGCGGTGGCTCACGCCTGTAACCC +AGCACTTTGGGAGACCGAGGTGGGAGGATCCGTTGAGCTCAGGAGTTCGAGACCAGCCTG +GCCAACATGGTGAAACCCCATCTCTACCAAAAATATAAAAATTAGCTGGGCGTGGTGGCA +TGCATCCATAATCCCAGCTACTGGGGAGGCTGAGGCATGAGAATCGCTTGAACCGGGGAG +GCAGATGTTGCAGTGAGCCGAGACGGCGCCACTGGACTCCAGCCTGGACAACATGGTGAA +ACCCCATCTGTACCAAAAATATAAAAATTAGCTGGGCGTGGTGGCATGCATCCACAATCC +CAGCTACTGGGGAGGCTGAGGCATGAGAATCGCTTGAACCGGGGAGGCAGATGTTGCAGT +GAGCCGAGACGGCGCCACTGCACTCCAGCCTGGACTACAGAGCGAGACTCTAGCTCAAAA +AAAAAAAAAAAAAAAAGTAACTTAGGTGCAGGGTGTCCTCTGTTATTCACTGAGACCGTG +CCCCGGTTATGAGGTTGTACCAGAAAGCAAGTATTCACTATGCACACTATTCACCGCTCA +CCCTAGCATTGAAGCCAGCCTGTAGCCTGAAAGCCTTTGCTTTGAGGGCAGGTCTTTCCC +CAAAATGCAGACACGAAGGTGCAAAGTGAAGCTGCCAGTCTTGCAAAAGATGTAACTTGT +CACGAAGGCCACGAGTGGCAGGGAGAGCTGTCCCACATTTGCGGAAGTGGCTATGTGAGG +ACGGGGGAGGCGGGTCCCTTAGAGATAAGAGACAATCATAAGGGGAGATATCAGAGAAAA +TCGTAAGGGGAGCAGATGGTTGTCAAGAGAATAGGCTGACCATCGAAGGACTGGCAGAAG +CTTTCAGAAAACCACTGGACGGCTGGGCACAGTGGCTTAGGCCTGTAATCCCAGCACTTT +GGGAGGCTGACGCGGGTGAATCACTTGAGGTCAGGAGTTCCAGACCAGCCTGGCCAACAT +GGTGAAACCCCATCTCTACAGAAAATATAAAAATTAGCCAGGCGTGGTGGCACAAGCCTA +GAATCCCAGCTACTTGGGAGGCTGAGGCAGGCGAATGGCTTGAACCCAGGAGTCAGAGGC +TGCAGTGAGTCGAGAGTGTTCCACTGCACTCCAGCCTGGGTGACAGTGCAAGACTCCTTC +CAAAAAAAAAAAAAGAAGAAAAAAGAAAACCACTGCAGCTCTAAACTAGTTCTGCATTTT +TGCCGAACCTGGTTTGCTGGAAAAGCCCAGCACCAAAGGCTATCATACAAAGCTGTGGGA +AATTGAATCACCAACCTCACCCCTTCTGCTTGTTCAGTTGCAGTTATAACCCTTTTATTA +AATACAGTATAAAATACCACGCCTCTAATCCGAGTGCTCTGGGAGGCCAAGGTGGAAGGA +TTGCTTGGGGCAGGGAGTTCAAGACCAGCCTGGGCCACACGGTGAGACCCATCTAGACAA +ACATTTTTAAAAATTAGACAGGTGTGGTGGTGTGCACCTGTAGTCCCAGGCTGGGTGGGA +GGATCGCTTGAGCCCAGGAGTTTGAGGCTGCAGTAAGCTGTGATCGTGCCACTGTACTTC +AGCCTGGGTGACAGAGCAAGACCCTGTCTCTAAAAAAAAAACAAATTAAGGCCAGCCACA +ATGTTTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCAGGCGGATGACTTGAGGC +CAGGAGTTCGAGACCAGCTTGGCCAACATGGTGAAAGCTTGTCTCTGCTAAAAATACAAC +AACAACAACAAAATTAGCCGGGTGTGGTGGTACACGTCTGTAATCCCAGGTACTCAGGAG +GCTGAGGCGGAAGAATCACTTGAACCCGGGAGGCAGAGGTTACAGTGAGCCGAGATCACG +CCACCACACTCCAGCCTGGGCGACAGAGCATGACTCTGTCTCAAAAATAAATAAATAAAT +AAATAAAAATAAAAAAATACATACATATAAAAAAGAAGAGAAAATACTTATTTTCATGAT +TGTTTCATTTTTTTCCAAGCTGAGGTCCTGACCAAATGTTTCCCCGTGGTTTTTGTATAT +TTCTGATCCCCTTAAAGTGGCCCTTGCAGCGTGCTGGGGAGGAGGCCTCTCGGTGGGTGG +GTGATTGGGAAGCCACGCCCACAGGGAAGGGAGAAAAAAACTGAAGTTGCCTGCTCTAAG +GGCTGCACCTCTGTTTAGCCAACAATTTTCTTGAGGCCAGTCATAGTGCTGGGCTCATTC +CATCATCTCCAGTTCTGAGACCAACACTGTCTGGTAGGTGTTTTATGGATGAGGAAACCA +AAGCTCATAAAATTAATTAAGTGGTTTGCTTATGAAATAATGCAAGAAAGCAACAGTGCT +GGGAGGTGGAACCGGGTTTTTCTTTTCTTCTTCTTTTTTTTTTTTTTGATGGAGTTTCGC +TCTTGTCACCCAGGTGGAGTACAATGGAGCGACCTCAGCTCACTGCAACCTCTGCCTCCC +GGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGTGCCCGCCA +CCCTGCCCAGCTAATTTTTTGTATTTTTAGTAGAGATGAGGTTTCACCATGTTGGCCAGG +CTGGTCTTGAACTCCTGACCTCAGGTAATCCGCCTGCCTTGGCCTTCCAAAGTGGTGGGA +TTACAGGCATGAGCCACTGCGGCTGGCCCAGGCTTTTCTTTTTGATTCTAAGGCCTTCCA +GATCCAGTACTTTATCCTGACCCTGCAGAGCTCAGGATCTGTGGTTCAGGCCTGCGGCTC +AGAGGAGGGAATACGGCACACAGGTACGTGCCAGGCCAAGTGTGAGGGGGTCTGGCTTCC +AGGGCCCTCTGCAGACCCCTAGTCCCAGGGCCTGTGTTGGAGGAGAGATTGGCTCTTTCC +TCTGCCCATCCTGGGATGAGAAGTCGGGGACTTGGGATAGATGCAGTGCAATCCCTGCCC +CTGAAAATTGACAAAGACCCACCAAATCTAGCCCCTACTCCTAGGCTGGGCCCCTGCCCA +TCTCCCTGGACCACACCACTCTCAAGGGCTCTCGTTTGCAGACACCCCATTGCCCTACTA +AAAACCTCTCCTGGCCAGGCTTGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCT +GAGTTGGGTGGATCACCTGAGGTCAGGAGTTCCAGATCAGCCTGGCCAACATGGTGAAAC +CCCGTCTCTACTAAAAATACAAAAATTAGCTGGGTGTGGTGGGGGGCGCCTGTAATCCCA +GCTGCTCGGGAGGCTGAGGTAGGAGAATTGCTTGAACTCGGGAGGCAGAGGTTACAGTGA +GCTGAGATCGTGCCACTGCGCTCCAGCCTGGGCAACCGAGCAAGACTCCGTCTCAAAAAA +ACAAACGAAAAACCTTTCCCAGCCATTCAGTCATTCCCACAGTCTCAACTCAGTCCTATG +AGTGACAGTGCATGTCAGTGGCCATCATATCTCAAGCCATCCTGGTCCCAACACACATTC +CTGGGGCCTTGGGAATTGATTCAAAGCAGAACAGCTTCATGAATGGTCCGGCCAACAGGA +GGCAGCCTAGGCTGAGCCCTACTGTCCCCTCCCTATCATCTGATTGGTGGACCACCAGGG +AGCCACACACATGACAGATGATGAGGGCAGAGGCTGCATGACAGATACCTGCTGGGTCTC +CATGTCAGGCACAGTGGCTGCTTAGGAATGAAGCACATGGGCCAGGTGTCGTGGCTCACA +CCTGTGATCCCAGCACTTTGGGAGGCCAAGGCGGGTGGATCACTTGAGGTCAGGGGTTCA +AGATCAGCCTGGCCAACATGGTGAAACCCCGTCTCTACTAAAAAATACAAAAATTATTCG +GTTGTGGTGGCGCATGCCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCACGAGAATCACT +AGAACCCGAGAGGCGGAGGTTGCACTGGGCCAAGATCACACCACTGCACTCCAGCCTGGG +CGACAGAGCGACACTCCATCTCAAAAACAAAAAGTGAAGCACATGGACTTTGGAGTCACA +TGGACCCTGGTTTGAATCCTGACAACTCCTATAATGGCTGCGTGACCTGGAGCGAGCCAC +TTAGCCACTCTGAGCTTCAGCTTCCCGTCTATGAAAGGGGGCTGCTCTGGTCCTGCTGCT +CGGCCACACCTCTGATATGTGGTGTGAACGAGTGCTCACTTCCACCAAGACCTGGACTCC +CCTCCAACTCCCGTTATAAACCAGCCTATCTGGGATTCCTTCTCCAAAAGAGCGCTGAGC +TTGCCAGAGCCAGCTGTACCTGAAGTCAACGACAGGAACTGCCTGGAGTGGGGTCATTTC +CCTGTGTCTAAGGATAGGCACCTGGGCTCCAACTGGGCTCCTGGCCTGGGGGTTGCTCTC +TCTCTCCTGCACCCCCTGTCATTTTTATCAAAGTCCTATTCTCCATTGCTTCCTGAGTGG +GTCATTAGGTGGAGATCCACAGCCTTCCTCCACGCTGGTCGCGTGAATTCCCCCAATCTG +GAAAGTATTCACAATTTTGTGTCACTAATTCCAGTGACTAATAGAGATCACACACACACA +CACCTTCAAATGACAACCTGCCAGGAGAAAAATGCTATAAAGGGAAAGATATCACTTTGG +GAAGCTGAGGCGAGTAGATCGCTTGAGCCTGGAAGTTTGAGACCAGCCTGGGCAACAAAG +GGAGACCCTGTCTCTACAAAAAAAAAAAAAAAAAAAAAAAAAAAACCACAAAAAACTCCA +CAAAAATTAGCTGGGCATGGTAGCATGCACCTGTAGTCCCAGCTACTTGGAAGGCTGAGG +TGGGAGGATCACTTGAACCCAGGAAGCAGAGGTTGCAGTAAGCCAAGGTCGCACCACTGC +ACTCCAGCCTGGGTGACAGAGCGAGCCGATTTCCTTGTTTCCAAAAATAAAAAAGGGAAA +GATATTATTGGGTCAACAGAGAAAACTAGAGTATGAACAGTAAACTGGATAAAATAATTG +CAACAACGTTCAATTTACTGAAGTTGGTAAAGGAAACGTTATTGTGTAAGAGAATATCCC +TGTTCTCTGAAAATACTCACTGAAGTATTTAGGGGTAAATGATATACGTAACTTTCCCTT +GAACGGTCCAGGAAAAAAATGAACATCCATTTATACACATATCATGGATACTCATAGACA +TTTGCTTATACACACTTACCATAGGTACTGATTATAGATACACATACACACATATGAGTG +AGAGGGAGAAGGAGGGAAGGGGGTAGGGAGACAAAGTGATCCAATAATGAAACAAGGGTG +AAATGTTAACAATTGAGAGTCTGGCTAAAGGGCATGTGAGTATTTTCCATACTATTTTTA +TTTTTGCAACTTTTCTTTTTTTTTTTTTTTGAGACAAAGTCTCACTCTGTCGCCCAGGCT +GGAGTGCAATGGCACAATCTCGGCTCACTGCAACCTCTGTCTCCTGGGTTCAAGTGATTC +TCCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGCACGTGCCACCATACCCGGCAAAT +TTTTGTGTTTTTAGTAGAGACAGGGTTTCACCATGTTACCCAGGCTGGTCTCGAACTCCT +GACCTCAAGTGATCCACCCACCTTGGCCTCCCAAAGTGCTGGGATTACAGGTGTGAGCCA +CATGCTTGGCCACAACTTTTCGGTAACTATTCATAGTAAAAAACAAACAAAAAAACCCCT +CTAAACCTTAACTTACTTTGTCTAACTTTTATAGACAAAGTCTACGTTATTTGCTCTGGG +GTTTTCCATTTTAAACCTGACCTTTCTGGCTCTGGGTTTTTCCATTTTAAACCTGACCTT +TCTGGTTCCAGGTGAAGGCAGAGACAGATAACATAGGATTATTGTATGTCAGTATGTTTT +CAACTATTTCTCCTGAAACTTGGAAACGTATTAGACCATGTGGGATACCACGCGGACGGG +AACGGGGGATAAATGTGTGTTCATATATACTCCTCCACAAATATACATGTCTCAGGCTGG +GCGCAGTGGCTCACGCCTGTAATTCCAGCACTTTGGGAGGCCAAGGCCGGCAGATCACTT +GAGGTCAGGAGTTTGTGACCAGCCTGGCCAACATGGTGAAACCCTATCTTTACTAAAAAT +ACAAAAATGAGCCGGGCGTGGTGGTGGGCACCTGTAACCCCGGCTACTCGGGAGGCTGAG +GCAGGGGAATCACTTGAACCCCGGAGGCAGAGGCTGCAGTGAGCCCAGATCGCCCCATTG +TACTCCAGCCTGGGTAACAGAGTGAGACTCCGCCTCAAAAAAAGAACCCCCAAAACCAAA +AAGCAAATATACACGTCTCTCTCCCTATTTCTCTGTTGATTGATTTAAACTTCAAGATGC +CAACTACAGTGCCTATCAGGGTGGCAGGCAGGTAATGTGAATGAATGAAACAAGCCAGGC +ATAAGAAAAGTCAACTACCAATAATACAATAAAACTTTCTTGATTTTTAATGAATAGTGA +GGCATACAATGTAATATAAACAAGTATGATACTGCAGATTATATTTCTGATTCAAAGTGG +AAAAAAAACTGAAAAAAAAAAAAGTTTAAGAACTCATTTTGTCAGCTGGGCACAGTGGTT +CATGCCTGTAATCCCAGCACTTTGTGAGGTCGAGGCAGGTGGATCACCTGAGGTCAGGAG +TTGGAGACCAGCCTGGCCAACATGGTGAAACCTCATCTCTACTAATACAAAAATTAGCCA +GGCATGGTGGCGCACGCCTGTAGTCCCAGCTGCTCGGGAGGCTGAGGCAGGAGAATCGTT +CGAACCCAGGAGCTGGAAGTTGCAGTAAGCCGAGATCACGCCACTGCACTCCAACCTGGG +CGACAGAGCAAGACTCCATCTCAAAAAAGAAAAAAAAATTCATTTTGTCATCTCCCAATC +CCTTGGGACTAGAAGACTCCAGCCTTTCCCACCATAGGGCCCTGCCAGGAGTTTTCTCTC +CATCACGTTGCGATGTGGAGTACAGAATCCCACTGGGAATCCTTTAACTGGGAGCAGTAT +TTTGTTTTGCTCAGTTTCATAATGGAGAACAGCTGTTCGCAGATGTAGGTGCTCCCGAAC +ATGGAAAGAATCTTTGCGCAATGGTGCTTGTATTTCGGGTAGCTACCCCAGAGGTACTTG +TAGAATTCTGGTATTCCCACCTTGTCGTATTTCGTCTTCAGGACCGTGTTGCATTGCAGG +TCGATAACCTCCATCTGGAGCTCCTCGTGCACACTGTCGATCTTCGTGGAGAACGGGGAG +CTGAACAGAGTCAGTTCGCTTTCGTAGAGTTTGAAATCAGACAGCCTTTTCTGGAATTCG +GTCTGGAGTTCCGCGATTTTGGGAATGTAGTTCAGGCCATCGCTTTCATTTCTGGAAGCC +AATTTCAGGGTGGGAAAGTGGGCCAGATTATTCCTCGTCAAATGAGTCTCCCAGAGGCAC +AGTTTTGCTAGGAACGCCCGGATCAGGTCATACATCTGCGTGACGATTTGGGAGTGTCCT +TGGAGAGAGATGTTCAAAGCGTTCAGATGCATCGTCATGTCAACCAAGAAGGCCAGGTCT +CGGATCCAATCTATGGAGCTCAGTTGAGGCAGGGGTTTCCCTCTGGATGACATGAAGGAG +TCGATTTCTTCCAAGGATTCGAAAAATCTCTTTAGCACGAGCCCGCGACTGAGCCACTTA +ATCTCCGTGTAGTACAGGAGGCTACCATACTGGCTGTCCAGCTCATAGAGCAAGGTTGTG +AACTCACTGTGGTTCAGTCCCCGGGAGCATATCCAGTTCACGGACTTCACTACCACGTCC +ATGACGTGGTCCATCTTCAACTTCTGAGCACAGAGTGATTCCGGATGAATTATACAACAG +ATGGACTTCAGTTCCGCACCCTTGCAGAACGTCGCCACCCTGGACTTCAGTTTTGTGACA +AGCCCGTTATTGGCATCCACCATCGCTGGGGTGCCAGTGGAGGCCACGCTTACTAATTTC +GACCAGTCGATACAGAAGTTTTTCAGGCTTTTCTCAACACGCGAAAAGATCTCGTTGCCA +GATTTTGTACCCGTCATGGGCACCGTGTCCAGAAGTTCTTCGGACACATCGAAATTCTCA +TCGACACCACGGATGAATATGGCCAACTGGGTGGTATTATTTATATCCGTGATCTCATCG +ATTGCGATAGAATATGCCACAAAAGACCTGATTTTTTCACGTAACTTCTCCCATAAGTTC +CCAGCTAGGTCCTCTACAGGCTGCACGGGGGATTTCTGGGTTGGACTTGGGTTTGCAAAC +ACTTGTTTTTGCTCGGGACACTCGGTGTCTGATGAGCCTAAGAGATACTTCCTGAGCCCT +TTTTTCAGCTCGTGAAGCTTCTCGTCACGCATTCTTTCCATATACTGGTCATAATGCTTG +CTGTGATTGGTTTGATAGTGGCGTCTTAGGTTATATTCTTTGGACACAGACATGCTTTGT +TTGCATATGAGACATGTTGGAATATTCTGTACTTCCACGAAGAAATACGCTCTCTCCCAC +TTTTCTTGAAACACACGGCCCTCCTGGTCTATCTTGCGTTTTCCCACTTTTGACAGAGAC +AGGGAGACAAAGATATTTCACTTTTCTCTTATCACTACTATGAGGAAAACAACAGCAAAT +GCTTGATGACGCACGAGAGGGAGGAAGCGGGGCGGGGCAGGGCGTGGTTAACAGGAGGGT +GACCCACCCTGCAGAGGGACGGCTGACCCTCAACTCCAGCAAACCGCTGCCAGGATGCCA +GCTGTGGCCAGATCTTCAAGTTTTCTAAAGAAAACCTGAAGACTGAATTTTTGTTGTCGT +TGTTGTTGAGACGGAGTTTTGCTCTGTCGCCCAGGCTGCAGTGCAGTGGCGCAATCTCGG +CTCACTGCAACTTCTGCCTCCTGGGTTCAAGCGATTCTTCTGCCTCAGCCTCCTGAGTAG +CTGTTATGACAGGTGCCTGCCACCACGCCCAGCTAATTTTTGTATTTTTAGTAGAGATGA +GATTTCACCATGTTGTCCAGGCTGGTCTCGAACTCCTGACCTCAGGTGATCCGCCCACCT +CAGCCTCCCAAAGTGCTGGGATTACAAGCATGAGCCACTGCACCCAGCCAGATCTTCAGG +TTTTCTAAAGAAAACCTGAAGATTGACTTTTATGAAAGAGTGCCTGGTTTGTGGTGATAA +TGACTCATTGCAGCCTGGAACTCCCTGGGCTCAGGTGATCCTCCCACTTCAGCTCCCAGT +TGCTGGGACTACAGGCATGCACCACACCGAGCTATCTTTTCTTTCTTTCTTTCTTTTCTT +TTTTTCTTTTTCTTTTTTTTTTTTTTTTGTAGAGCTGGAGTCTTACCTTGTTGCCCAGGC +TGGTCTGAAACCCCAGGCTCAAGCGATCCACCCGCCTTGGCCTCCCAAAGTGCTGGGATT +ACAGGAGCCACCGTGCCAGGCCTCATCCTTATTTTCAAAAGTACATGAGCCAAACAAAAG +ACACCTTTGATGAGGTTCAGCATGTAGCTGTGCTTGTTATGTCCAGTTTAAACAGGAATT +ATTTGATAATATGTTTGCATTTTCTTTTTAGAGACAGGGTCTTGTTCTGTCACCCAGGCT +GGAGTGTAGTATTGCAATTATGGTTCTCTGCTGTCTCAAACTCCTGAGTTTAAGTGATCC +TCCTGCTTTAGCCTGCCAAGTAGCTGGGGCTACAGGTGTGAGCCACTGTTTCCAGCTAAT +TTTTAAATTTTTTGTAGAGATGGGGTCTTGCTATGTTGCCCAGGCTGGTCTCAAACTCCT +GGCCTCAAGCAATCCTCTTGCCTTGGCCTCCAAAAGTCCTGGGATTATAGGTGTGAGCAT +TTTAATATATTTTCTCATTTGATTCCCAAGAAAACTTTGTAATAACAGAGATGGGAATGA +GCACAGAAAGGCATATGATTTTTACCTACTGTGAGTCTCAAATGACAAGGGTGACGGCCA +CAGAACCACACAAAACTCATTCGTATAAGTGTGTTCGAGTGTACAGGGGCTAGTGTTTTA +GATTTAAAGAACCTGGCCACCCTGCAGGTAATCAAGGTATTTCCAGAGTACACACACATA +AAAGTGCACCTTAAGAAAATGTAGGCCATGTACAGCGGCTCATGCCTATAATCCCAGCAC +TTTGGGAGGCTGAGGCAGGAGGATCGCTTGAAGCCAGAAGCTCAAGGCCAGCCTGGGAAA +CATAGTGAGACCCTGTCTCTACAAAAAAAAAAAAAAAAAAAAATTATCTGGGCATGGCAG +TGCTGTCCCAGTTACTCGGGAGGTGAAGGTGGGAGAATCACCTGAGGGCAGGAGTTCCAG +GCTGCAGTGAGCTATGATCATGCCACTGCACTCCAGCCTGGGTGACAGAGTGAGACCTTG +TCTCTAAAAAACCCCAATAATAATACAATAAATAAATAAAGATATTATAAAAGATCAAAA +AATCATTTAGCAATCAGATGCGTTTGGGAATAAAAATGGAGCATTTTAATAGGATACTTT +GGTTTTCTTTTCTTTTCTTTTTTTTTTTTTTTGAGACAGAGTCTTGCTCTGTCACCAAAC +TGGAGTGCAGTGGCACGATCTCGGCTCACTGCAACCCCCGACTCCCTGGTTCAAGTGATT +TTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTATAGGCACGCGCCACCATGCCCGACTAA +TTTTTGTATTTCTAGTAGAGACGGAGTTTCACCACGTTGTACAGAAGGGTCTCCATCTCC +TGACCTCATGATCCGCGCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGTGTGAGTCAC +CGCGCCCAGCCTACTTTGGTTTTCAAATGTTACATTAGGAGGTTCCCTGGTGACTCATGC +TCGTGAGAACACCTCTCCGTATTCTACTTGACAGGATACTGACTCACTTGCAAGGGCTCC +GGGGAAGACATTAAGAATATTTAACAGGGTGGGGGCGGGGGGAGGGAGAGCATCAGGAAG +AATAGCTAATGCATGCTGGGCTTAATACCTAGGTGATGGGTTGATAGGTGCAGCAAACCA +CCATGGCACACGTTTACCTGTGTAACAAACCTGCACATCCTGCACATGGACCCTGGAACT +TAAAATAAAAGTTGAAGGGGAAAAAAAAGAGAATATTTCAGAAGCAGAGTGCCTGGGCAT +TGCTCAATCAGAACAGATGCTGAGCCAGGTGCAGTGGCTTACATCTGTAATCCCAGCAGT +TTGGGAGACCAAGGCGGGTGGATCACTTGAGGTCACGAGTTTGAGACCAGCCTGGCCAAC +ATGGCTAAACCCTGTCTCTACTAAAAAATACAAAAAGTAGCTGGATGTGGCGGCACGCAC +CTGTAATCCCAGCTAATCGGAAGGCTGAGGCAGAGAATCGCTTGAACCCGGGAGGCGGAG +GTTGCAGTGAGCCGAGATCTTGCCACTGCACTCCAGCCTGGGTGAGAGAGCGAGACTCTG +TCTCAAAAAAAAAAAAAAAGAAAAAAAAAAGAACAGATGCTAGTCTCAGCACTGGAAGGG +TTCTAGGGGCCTCTGCTGTGCCAGGTGGAACCCCTTTTGCTTCAGCACTGTAGGGAGGTC +AAGCCACGGTCGGAGGGTACTAGGGTGGGACTGCATGGCCAGGCAGGCACTATTTACCAA +CTAACACAGAGGAGATCGGTACTGTGATCCTGAGTGCAGCTGTGCGGGTGGCCTCAGGGG +AGCCCCCACCACAAAGCACACTTGAATAGTGTGCCACATCAGCCATGCGTGGTGGCTCAT +GCCCGTAATCCCAGCACTTTGGAAGGTGGAGGCGGGCAGATCCCTTGAGGTCAGAAGTTC +AAGACCAGCCTGGCCAACATGGCAAAACCCCATCTCTACTAAAAATACAAAAATTAGCCA +GGCGTGGTGGCACACGCCTATAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATCACT +TGAACCCGGGAGGCGGAGGTTGTGTGGTGAGCCGAGATTGTGCCATTGCACTCTAGCCTG +GGTGACAGAGCGAGACTCCGTCTCCAAAAAAAAAAAAAAGAGTGCGCCACATCACACGTC +ACACTCATGGTGTGATATAGATCACTCTCCTTCAGACTGGTTAATCAAACTCAAGTAACA +GAGTTATCTAACTTTATCACATGCAGGAAAAATAAAGCATGCATCGAAGGCTGCATACTT +GGGTCCCAGGCTCACGGAAGCAAAAACCCCGTGGTGAGCGCCCACCAAGACACTTCCCAT +GGCCCAACATTGCCGGAACGTTCTTCTCACCTGTAGAATACTCACCATTACTGAGCTCAA +GCCCTGGAAGCGGCCTGAAGAGAAAGACACATTGATAAATGTGACAAGCTCACATTTCCT +CTTTTGCCCACTTAGTTTTATTTTTTTTTAATTTTTACTTATTTATTTTTTTACAGAAGA +ATATTTATTTATTTGTTTGTTTTGTTTTTGTTTTTTTTGAGACAAGAGTCTCGCCGCGTC +ACCCAGGCTGGAGTGCAGTGGCGCGATCTCGGCTTAGCGCAACCTCCGCCTCCTGGGTTC +AAGCCATTCTCCTGCCTCAGCCGCCTGAGTAGCTGGGATTACAGGTGCCCGCCACCACGC +CCAGCTAATTTTTTGTATTTTTAGTTTCACCATGTTGGCCAGGCTACTCTTGAACTCCTG +ACATCAGGAGATCTACCTACCTTGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCAC +TGCGTTGAGCCTTTTGTTTTTGTTTTTTTTGAGACGGAGTCTCACTCCATCACCCAGGCT +GGAGTGCAGTGGTGTCATCTGGGCTCACTGCAACCTCCACATTCCAGGTTCAAGTGATTC +TCCTGAGTAGCTGGGATTACAGGCACGTACCACTACACCCAGCTAATGTTTATTTTTAGT +AGAGATGGAGTTTCACCATGTTGGCCAGGCTGGTCTCAAACTCCTGACCTCAAATGATCC +ACCTGCCTCAGCCTCCTAAAATGCTGGGATTACAGGCCTGAGCCACCATGCCCGGCCTAT +TTATTTATGTTTTGAGATGGAGGCTCATTCTGCTGCCCAGGCTGGAGTGCAGTGGTGCCA +TCTCAGGTCACTGCAACCTCCACCTCCCAGGTTAAGTGATTCTCACGCCTCAGCCTCCTG +AGTAGCTGGTATTAGAGGCGCACGCCACCACACCCGACTAATGTTTGTATTTTCAGTAGC +AACGGGGTTTCACCATGTTGGCCAGGCTTGCCTCATACTCCTGACCTCAGGCGATCTGGC +CCGCCTCAGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCTGGCCCCACT +TAGTTTTATTGGACAAATTTTTGCAGAGTATCAACTCTACGCTAGGTGCTGTGTGAGCTA +AAACTGGGACGGGCTGCCCATGATCACCGAGGAACAGGGACATGGACACATCTCAAGGAA +GCAGAAGATGATGAAGTCAGTGTGAGAGGCAGCATGGCCCAGCGGTCAGCTGCGGGAACA +AACCCCCAGCCCAAGTCATGGGACAGACATTCCTGGGCAGCCACATGCCCACCTCGGGCA +AGTCAGAGTCTCCAGATTCCTTCTCTTGACTCACTTACCTGATGACTGTGAATTTGATAA +ACTCAGCTGCCTCCAAGATCCTCCTCATGGAACTGATTTCCAGATAGCCGGGGGCCTTGA +ATACCACCCCCGGGGGCATGCCATCAATCACCACACAGCCAGGGTTGAATGTGATCTTCC +TGTAGGGAACTTTCACAGGGAAATCCACGCCAATTGCTTCACCTGTGACGGGATGAGCAG +CATAAAACCAGCTGAGTTTGGCTGGGCACGGTGGCTCACACCTGTAATCCCAGCCCTCTG +GGAGACTGAGGCGGGTGAATCACTTGAGGCCAGGAGTTCGAGACCAGCCTGGCTAACATG +GTGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCGCATGCCTGT +AATCCCAGCCACATGGGAGGGACCCAGGAGGCAGAAGTTGCAGTGAGCCGAGATCGCCCC +ACTGCACTCCAGCCTGAGAGACAGAGCGAGACCCTGCCTCAAAACAAAACACAAAACAAA +ACAACAAATTAAAAAAACAACAACACAAATAAAACTAGCTGAGTTTGTTCCTTACGTTTC +CTAAACCAGGATTTTTCTTTAATGTCAGGATTTAGAAGCATCAAATGACAATACTTATGA +TCAGTCATTTTATTTTCCAGTGCTACTATGATGTGTGAATATAATTTTAAAAGTTTGGAA +TTAGCATGGGTAGTAGGCAAACTCAGTTCCTCCATCCATTACACAGGGTTATCATGGCGC +CTACCTGAAAGGTTTTATGTGAGGATTAAATGATCAAACACATGTTGAGCACAAAAAATA +ATATACAAGGTAAGCACTCAGTAAAACAAAGATAGCTATTATTATTATTATTGTAATTAG +TCAATGATACCATGCAAAAGCTCTTCTGTAAAAAGACATATTGACTAATTTTTATCATAG +CTCTTTCACAAAAAGATCAATTTCTTTTTTTTTTTTTTTTTTTGAGACAGGGTCTCACTC +TGTCGCCCAGGCTGGAGTGCAATAGCGCGATCTAAGCTCACTGCAACCTCTGCCTCCCAG +TTACAACCGATTCTCGTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGTGTGCGCCACC +ACACCCGGCTAATTTTTTTGTATTTTTAGTAGAGATGGGATTTTGCCATGTTGGCCAGGC +TGGACTTGAACTCCTGGCCTCAAGTGATCCACACACCTTGGCCTCCCAAAGTGCTGGGAT +TAAAAGTGTGAACCACTGCGCCCAGCCAAGATCAAATTCTTATAAGATAAAGTTTTGTTT +TTTTCCTTTTGTAGACCTGGGGTGTCACTTTGCTGCCCAGGCTGGTCTCAAACTCCTGGG +CTCAAGTGATTCTCTAGCCTTAGCCTCCTAAAGTGCTAGGATTACAGGTATGAGCCAATG +CACCTGGCCAAGTATTCTTTTAAAAAGAAGTATTTTAGGTATATGAATTCTGGATATAAA +AAGATATAAAAACTTACCAAATTTTCGGCTAAAGAGGTCATTAACTTGTTCTCTTAGCTG +TTTAATCTTTTCAATGCTTGATAATCTTTCCTTCTCATTATCTAAAAATAATTAAACAAA +TAAACAAACCAAGGTTATTAATGTATTTTCTCCCAAGAAAGCTGTTGGGAGAAATGCCTG +TTAGCACCCGAGAAAGTGCTTTACCTGGATTGTTATTCAGTCTACTTTTAGCAATAATTA +AGCATCTTGGAAATTTGGAAATGGAAGCCATTACAGACAATAGAGAATTTTCCAAATTAT +AACCCTATATAAACATACTACATACTACTTTTAAGGAATATTTTCAATATCATACAAGAC +AAGGATGTTTAGGGCCAGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCC +GAGGCAGGTGGATCACGAGGTCAGGAGATTGAGACCATCCTGGCTAACATGGTGAAACCC +CGTTTCTACTAAAAATACAAAAATTTAGCCGGGCATGGTGGCAGGCGCCTGTAGTCCCAG +CTACTCGGGAGGCTGAGGCAGGAGAATGGCGTGAACCCAGGAGGCGGAGCTTGCAGTGAG +CCGAGATCGCGCCACTGCACTCCAGCCTGGGTGACAGAGCAAGACTCCGTCTCAAAAAAA +AAAAAAAAAAAAAAAAGACAAGGATGTTTACTTTCACCACCACTTTTCGGCCTTAAAATA +GAAATCTTAGCCAATGAAATATGACAAGTAAAAGGAATAAGAGGTACTAGGATTAGAAGG +TAAGGTATATTTTTATTTTCTTTCCTTTTTTTCCTCTCTTTTTTTGTTTGTTTGTTTTGT +TTTGTTTTGTTTTGAGGCTGAGTTTTGCTCTTGTCACCCAGGCTGGAGTACAATGGTACA +ATCTTGGCTCACTGCAAACTCCTGGGTTCAAGCAATTCACTGCACCCCTCCTGGGTTCAA +GCAATTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGCACCCACCACCACACCA +GCTGATTTTTGTATTTTTAGTAAAGATGGGGTTTCACCATGTTGGCCAGGCTGGTCTCGA +ACTCCTGACCTCAGGTGATCCACCTGCCTCAGCCTCCCAAAGTGCTGGGATTACAGGTGT +GAGCCACCGCACCCGGTCTGTTTTTCTTTTCTTTTTGTTTTTTAGAGACAGAGTCTCACT +GTGCTGTGCAGGCTGGTCTCAAACTCCTGGGCTCAAGTGATCCTCCTGCCTCAGCTTCCC +AAAGTGCTGAGATTACAGGCACATGCCACCATGCCTGGTCCTTTTTTTTTGTTTTTATTT +TTTAGATATTTTTCAACACTTTAAAACTTTATTTACTTTTGAATAACTAAAGCAATCACA +TGGCTCAACATTCAAGAGGAGTAATATACAGAAACATCTCAAACGTCTCTCTCCTATCCC +TATCTCAGCGGTCAGTTTCCTTCCCTGGAGGAACTATGTAATTAGATTCTCTTGTATCTT +TCCAGATATATTTTACATACACATATTCAGAAAAGAAGATTATTATTATTATTATTATTT +ATTTTTTTGAGACAGAGTCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGTGATCTCC +GCTCACTGCAAGCTCCACCTCCCAGGTTCACGCCATTCTTCAGCCTCAGCCTCCCGAGTA +GCTGGGACTACAGGTGCTCGCCACCACACCCGGCTAATTTTTTTGTATTTTTAGTAGAGA +CAGGGTTTCACCGTGTTATCCAGGATGGTCTCGATCTCCTGACCTCGTGATCTGCCCGTC +TTAGCCTCCCAAAGTGCTGGGATTACAGGCGTAAGCCACCGTGCCCGGCCAGAAGATTGT +TAATGATGAGCAACAAAACATTTCACCTCTGTGGCCAATTCCAATTCAACCATAGCTGGT +GCTCCGTGCTGCCTGCTCTGAGATGCATTTTCCAGGTAATGCCCGGGCTTGTCCAGGAGA +AGCAAAATATCCGATTAATAATGTCTGATGTGAGCAAGATGCTCGTTGTGTAGCAACTTG +CAGAATATTTTATATTCCCGAAATGTCATTTCTTAGCTATCAGGGTGAACTAAGTGAAAA +ATGACAGGTCCAAGAGACCAGCCTATGTCAAAAAATAATTAAGACAAAAGGAAAAATGTA +ACATTAGTCCATACCTGGAACAGTCACTTGAACGATGTTAAGATCTTCAACACCTGCTGC +AGAATTTGTAACACTGGATGAATTTGTGTTTCCTTAAAACAGAAGTTGAAGTTTAGAATT +TACCAAGAATAAGACCAATTCTCCTTTAAATATGTCTAAGTGCTGCTTTGATCAGAAGCC +CAGACTGAATTTTTTTTTCTTTTTTTTTTTTTTTTTGAGACAGGTTCTTACTCTGTCATT +CAGGCTGGAGTGCAGTGGTGTGATCCTAGCTCACTGCATCCTCGACCTCCCACGGTCAAG +TGATCCTCCCACCTCAGCCTTGTGAGTAGCTGGGACCACAGACATGCACCATCATGCTTG +GCTAATTTTTTTTTTTTTTTTTGAGACTGAGTCTATCACCCAGGCTGGAGTGCAGTGGTG +CGATCTCGGCTCACTGCAACCTTTGCCTCCCAGGTTCAAGTGATTCTCGTGCCTCAGCCT +CCTGAGTAGCTGGGATTACAGACACCCACCACCATGCCCAGTTAATAATTGTATTTTTTT +TTTAGTAGAGACGGAGTTTCACCGTGTTGGTCATGCTGGTTGAGAACTCCTGACCTCAAG +TGATTCACCTACCTGGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCACGCCCG +GCTCTAATTTTTGTATTTTTAGTAGAGACAGAGTTTCGCCATGTTGGCCAGGCTGGTCTT +GAACTCCTGGCCTCAAGGGATTCACCCACCTGGGTCTCCCAAAGTGCTGGGATTACAGGT +GTGAGCCACCCACCACGCCAGCCTTAAATCACACTTTCAACTTCACTTCCTTTAGATACT +TGCACTTCAACTGAGTTCACCGGCTGCAGGCCTGCGGAGTTACCTTTGATATTTATCTGT +CCACTCCAGTAGCAAAGGGGCTATGTCTGAGTGAATCGTCCTTTTCTTTCCATTCTCCCC +CCTCATGTACCCTCAACCCTTCATTCTTTCCTCACGTGAACACAGCACAGTTGAGGCCCA +GTTGTGGGTCAGTGCTAACGTGCAAGACTTAAAAAAAAATTTTTTTTTAATTTTTATTTT +TAGAGATGGAGTCTTGCTCTGTTGACCATGCTGGAATGCAGGGGCATAATCACAGCTCAC +TGCAGCCTCAAAATCCTGGGCTCAAGCGATCCTCCCACCTCAGCCTCCCAAGTAGCTGAG +ACTACAGATGCATGCCACCATGCATGGCTGATATTTTTGTTAGTTTGTTTCGAGGCAGGA +TCTCACTCCCATCACCCAGGCTGGAGTATTGTGGCACAATTACGGCTCACTGCAGCCTCG +ACTTCCCTGGGCTCAGGTGATTGGCCCACCTCAGTCTCCCGAATAGCTGGGACTACAGGT +GTGTGCCACCATGCCCTGCTAACTTTTTGTATTTTTAGTAGAGACAGGGTTTCACTATGC +CCAATTTGGTCTCAAACACCTGGGATCAAGTGATCTGCCCACCTCAGCCTCCCAAAATGC +TGGGATTACAGGCGTGAACCACTGTGCCTTGCCTAACTTTTTCTTAATGTTTACTTTTTG +CAGAGATAGTCTCACTATGTTGCCCAGTCTGATCTAGAACTCCAGGGTTCAAATGATCTT +CTTGCCTTGGCCTCACAAAGTGCTGGGAATACAAGCATGCACCATCATGCCTAGTTATTA +TTTTTCTTTTCTTTCTAATTTTTTTTTGCACAGCTAATTATGTTGTCTACAACACCTCAA +AGCATTGGGCCCTAATGGGAATGGCTGCTCTATTATATATATACATTATACTACATTAGA +GATTTCAATCTCTTCCCCACAATTTTTTTTTTTTTTTAGATGGAATCTCGCTCTGTCACC +CAGGCTGCAGTACAGTGGTGAGATCTCAGCTCACTGCAACCTCCGCCTCTCAGGTTCAAG +CGATCCTCCTGTCTCAGCCTCCCAAGTAGCTGGAAATACAGACATGCACCACCACGCCTG +GCTAATTTTGTATTTTTAGTAGAGACAGGGTTTCGCCATGTTTCCCAGGCTGGTCTCAAA +CTCCTGGGCTCAAGCAATACACCTGCCTTGGCCTCCCAAGGTGCTGGGATTACAGGCTTG +AGCCACTGAGCTCTGCCATCCTCCCTGCAATTAATCCTGTTAGAAAGAATGAAAACCATA +CTTGGCAATGGGGCTTTGGGCAACTAACCTTCGATTTTCACCTCGGCTTCAGGGTCCTCA +TTTGGTTCTTCTGAAGGGACCAGCGGAGTGGAATCTTGAAAAAAAAATGTCTAAAATGAC +ATTCATTATTAAGTATTCTCCTCATATTCCAACACATTAATGCTCCTATACCAAAAAAGT +AGCTTATCCTGGCATTTTAAATATATTTCATATATAAATAATATAAACATAATTTTAATT +TTATAAGCAATAATAATAGGATAATAAACAGTAACTGGGCCGGGCACGGTGGCTCGCACC +TGTAATCCCAGCACTTTTGGGAGGCCGAGGTGGGCGCATCACTTGAGGTCAGGAGTTGAA +GACCAGCCTGGGCAACATGGTGAAACCCCAACTCTATTAAAAATACAAAAATTATCCAGG +CGTGGTGGCGCACGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGAGGGAGAATTGCTTC +AGCCCGGGAGGTGGAGGCTGCAGTGAGCCAAGGTCGCGACACACTGCACTCCAGCCTGGG +TGACAGGGTGAGATTCTGTCTCAAAAAAAAAAAAAAACAGAATCATTTTGGTAGTCCATG +TGTCACTATCTCTCTAAGGCAGATATATACAACTAAAAGTAAGATCACATTGCCTGTAAA +TGGCAAAGATGTCCCACGCCTCTAGGTTTGGAAAGGAAATCTTTATTATTATTATTATTA +TTATTATCATTATTGAGACAGTCTCACTCTGTCACCCAGGCTGGAGTGGAATGGTGCGAT +TTCGGCTCACTGCAGCCTCCGCCTCCTAGTTTCAAGCAATCCTCGTGCCTCAGCCTCCCG +AGTAGCTGGGATTACAGGTGCCTGCCACCACGCCTGGCTAATTTTTGTATTTTTAGTAGA +GACAGGGTATCACCATGTTGGCCGGGCTGGTCTTGAACTCCTGACCTCAGGTGATCTGCC +CACCTCAGCCTCCCAAAGTGCTGAGATTACAGGCATAAGCCACCATGCCTGGCCCTTTTT +TAAAATTATTAATTTTATCTTGGACATACACAAACCACCGTAGGAATTTAGGCTTTATTC +ATATGATGCTCAAGATTTATATATGAATGGAGGGAAGTATTATCAAATTTTACTTCTAAT +GCAAGGATTTCCTAAAATACTATTCGACTCTGTCCAAAAGAATTATGTCATGCCATCCAA +AAGACAAAGCAAGAAACAGCACCACTGCAAAGTTAACTTCCATATTCGGGTGCTTTAAGT +AGAATCACTCACAGATCAGAAGCACAAGAAGTGATAGAGCCCTTCATGTTATATCTTAGG +GCAAGAGCTCAACTATTCATAGTTTTCTGAGAAGACAGGCATGCCAGAAAGTCACCTTCC +TTATTTTCCAACTTACATGTATAAAAGAGTATGTTCTCTGTAAAATACTATAAACTTTCA +GCTGGGCATGGTGGCTTACGCCTGTAATCCCAGCACTATGGGAGGCAGAGGTGGACGGAT +CACTTGAGGTCAGGAGTTCAAGACCAGCCTGGACAACATGGTGAAATCCCGTCTCTACTA +AAAATACAAAAATTAGCCGGGCGTGGTGGTACGCGCCTGTAATCGCAGCTACTCAGGAGG +CTGAGGCACATGAATCGCTTGAACCCAGGAGGCAGAGGTTGTAGTGAGCCGAGATTGCGC +CACTGCACTCCAGCCTGGGTGACAGAGCGAGACTCTGTCTCAAAAAAGAAAAAAAAAAGT +ATGTTCTTTGTAAAATACTATAAACTTCTATAAACTTTTCTTAAAAGAGAGAGAAAAAAT +GCTGCATTTTTCTAACCTTCCATTGGTAATTCCATTTCTATTACTTCATTGCTTGTGGAA +GAAGGGTGGCTTCCTGAAAGAAAAATAAATAATATATAACAAAGGAGAAATACAAAAATG +TAAAAAGAAATCACTGAATACAATGCAAACAAGTCAATACCCACACAGGAATACACCTGA +AATACTTCTACCCCTTGAAATAAAACTGGCTGCGCGCGGTAGCTCACGCCTGTAATCTCA +GCACTCTGGGAGGTGGAGGCGGGCAGATCACCTGAGGTCAGGAGTTCGAGACCAGCCTGG +CCAACATGGTGAGACCCCTTCTCTACAAAAAAATACAAAAATCAACCGAGTGTGGTGGCA +CACGCCTGTAATCTCAGCTATTCTTGAGGCCGAGCCAGGAGAATCACTTGAACCTGGGAG +GTGAAGGTTGCAGTGAGCCATGATCACGCCACTGCATTCCAGCCTGGGCGACAGAGCGAG +ACTCTGTCTAAAAAAAAACAAACAAAAAAAACATAAACCAATTAATTTCTCTGAGTTTCT +CACATTCTGGATTTTATTGACTACATCCTTGTGGTGATGTTTTCATATGTGCCTGTATTC +CATGCATCTCCTAAAAACTGCTGGTTAGATCTAAAGGCTGGATCAGACTTAGGTCTGATT +GTTTTGTTTTGTTTTGTTGTTGTTTTGAGAGAGAGTCTCACTCCAGCACCCAGGCTGGAG +TGCAGTGGTGTGATCACAGCTCGCTGCAGCCTTGACCTCCCAGACTCAAGCGATCTTCCC +ACCTCAGCCTCCCAAGTAGCTGGGGCTACAGGTGTGTGCCACCATGCCCGGCTACTTTTT +GTATTTTTTGTAGAGACGGCGTCTCACCATGTTGCCCAGGCTGGTTTTGAACTCCTGGGC +TCAAGTCATACACCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGTATGAGACACTAC +ACCTGGCCAGGTTTGATTTTTTTTTTTTTTTTGGAAGAATCCTTGACAAAGGTGGTGTGG +TGTACTTCCTACTGGATACCGTCAGGAGACCAGTGACCAGTCAGTTCAGGAACTGTCAGT +CAGGTCTGCCCATGATAAAGTCCCCATCAGACTTTTATAAAATGGTTTTAATGACCACTG +ACAATTATTGCCAAGATGCACTGCTTCATTAGGTGGTGCAAAATCATGACAGTCGTGACA +ATTTATGACTTCTTTTTAAAAGCCTTATGGGTCAGGTGTGGCGGCTCATGCCTGTAATCC +CAGCATTTTGGGAGGCCAAGGTGAGTGGATCACCTGAGGTCAGGAGTTCGAGACCAGCCT +GGCCAACATGGCGAAACCCCGTCTCTACTAATAATACAAAAAATTAGCCAGGCGTGGTGG +CACACGCCTGTAATCCCAGCTCCTTGGGAGGCTGAGGCACAAGAATCATTTGAACCCAGG +AGGCAGAGTTTGCAGTAAGTGGAAATAGTGCCACTGAACTCCAGCTTGGGCAACAGAGTG +AGATTCTGTCTCAAAAAAAAAAAAGAGTATGTGGATTTAGCCCAGGCATGGTGGCTCACG +CCTATAATCTCAGCACTTCTGGAGGCCAAGGCTGGAGGACTACTTAAGCCCAGGAGTTAG +AGAACAGCTTGGGCAACAAGGTGAGACCTCATCTCTGTAAAAAAACAAACAAAAGAGTAC +GTGGATTTAGGCTAAATAGAATCTATTTTATAACTGTAGGATTATTTACTCTAAATGGCA +GCATGCTAGATCCTAGGTAAACACACATGGGTGCTCGCCAGTTTTTCAGACAGGTAGTAA +TTAAAATCTTCCATCCCAAATAACTTTTGGGGAAGAAAATTATTATCAAACAGTATTACC +TTGCATATTATATTGATAGTAATTAGGATCTTCTGATTCTTTCTTGACTGAGACAGCTTC +TGCTTTCAGTGAAATGCCTTGGAATGTAATGGAAATGATAAAATTGTATGTTAGGTTAAG +TTTGCCAACAAAGAAATACGACTAGCTAATATAAGTTGATTAATACAGCAATGTTACAAT +CAGCAAAAGAACTTGTAGCTCACTCACTATGAACAAATTTGACCTCTTGATACAAAAATA +GAAATACTATAAATTAAAATAATATACATATAGAAAACATACATTTGTGTATTTATGTAT +GTTTATATAAAAATAATATCAATTGTAAAATCAATAGAAAAGGAAAGAAGGAAGGAGGGG +ACCGGGCACGGTGACTCACGCCTCCAATACCAGTACTTTGGGAGGCTGAGGCGGGCAGAT +CACTTGAGGTCAGGAGTTTGAGACCAACCTGGCTAACATGGTGAAACCCTGTCTCTACTA +AAACTACAAAAATTAGCTGGGAGTGGTGGCGGACGCCTGTAGCCAGCCACATGGGAGGCT +GAGGCAGGAGAATTGCTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCTGAGATCGAGCCA +CTGCACTCCAGCTGGTTGATAAAGCGAGACTCCATCTCAAAAAAAAAAAAAAAAAAAAAG +AAAGGAAGGAGAGGAGGATGAAGGAAGGCATCGTGAAGGCGGGAGAGCTTAGTTCTGATT +CTAGTCCTAGTTTTGGGAGATTTTCCCCTTCAGGGTGGCTGAATATCCACGTGCATTTAC +ATGAAATGCTGTGAAGATTCTTCTGTCATGAAGCCTGAACTGACATATATAACCATTTTT +TTTTTTTTGAGACAGAGTCTCACTCTGTTGCCCAGGCTGGAGTGCAGTGGCATGATCTCG +GCTCACTGCAACATCCACCTCCCAGGTTCAAGTGACCCTCCTGCCTCAGCCTCCCAAGTG +GCCCACGCCACCATGCCTGGCTAATTTTTGTATTTTCAGTAAAGACGGGGTTTCACCATG +TAGGCCGGGCCGGTCTCAAACTCCTGACCTCAGGTGATCCACCCACCCACCTTGGTCTCT +CAAAGTGCTGGGATTACAGGCATAAGCCACCGTGCCCGGCTAGGCACTTATAATCTTAAC +TTACTCACTATAATGGAATGGATTTCAAAACCTGGAGAAGCTATATCAGTACAACCTAAT +GCCTTTATCAGAGAAGGGTGCGGTTGGCTGCAAAAATTAGCTCAAGACCTCTCCCATCCC +AGGATGTACATCCCTTTGCAATGTGACTATCCCATGCTTCTTTTCTAGAAGTAAAGTCTG +TTTCTCTGCCATTTTGTTATTATTTTTTGAGACAGAGTCTTGCTCTGTTGCCCAGTGGAG +TGCAGTGGCATGATCATGGCTCACTGCAACCTCTGTCTCCTGGGCTCAAGCGATCCTCCT +GTCTCAGCCTCCTGAGTAGCTGACTATAGGCATGCATCACCACGCCTGCCTAATTTTTGT +ATTTTTTGTAGACATGAGGTTTCACCATGTTACTCAGGCTGGTCTCGAACTCCTGGACTC +AAGCAATTTGCCTGCCTTGGCCTCCCAAAATGTTGGGATTACAGCTGTAAACCACGGCGC +CAGGCCATTCTCTGCCCTTTAAATCTGGCCCTGGCTGTGTGACTTGCTTTGGTCAATGGG +ACATCAGCCGATGGGATGCAAAGAGAGGCTTGAGAAGAGCTTGATCATCTGTGCCTGCTG +CTTCTAGAACCTCATCACCATGGGAGCCAGCCTAGGGTGCCTCCAAAGGGTATGAGGCCA +CAAGGAGAGAGACCCTGATGTCCCAGCCGGGGCCTCAGACACACAGCCATCCGGCCCTTG +CTGAGCCAGTCCAGCCAACACACAGAAATGTAGGAAAGACTAAATATTCCATTCCATTCC +ATTGGAGCCCTTCCCCTTCTCTTTCCAGCCCAGGCTGGAGTGCAATGGCATGATCTTGGC +TCACTGCAGCCTCCACCTCCCAGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCAAGTAGC +TGGGACTACAGATGCGCACCACTACGCCTGGCTAATTTTTGTATGTTTAGTGGAGACAAG +GTTTCACCACGTTGGCCAGGCTGGTCTCCAACTCCTGACCTCAGGTGATCCGCCTGCCTT +GGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGCCACCACACCCAGCCTCATTTCAGGGG +TACTTTTAAATACAGCAATAGATGACTGATACTAAAATGTACATGTAATTTAACCATGAA +TGTTTGTAATAGCAAAACAAAAAAACTGTGGCATAGCTTGGGGTTCATTGTTTAACATAA +TTTATAAGTTCTGAGGGGTCGTCTGAAAACCTTTAACAGCTCTGTTGGTATAAGGACAGT +GAAGCTAAACATTTAAAAATCTGATTTTCAGCTGGGGACAGTGGCTCAGACCTGTAATCC +CAGCACTTTGGGAGGCTAAGGTAGGCAGATCATTTAAGGTCAGGAGTTCGAGACTAGCCT +GAACAACAGGGTGAAAACCCGTCTCTATTAAAAATACAAAAACCAGCCAGGTGTGGTGGT +GGGCACCTGTAATCCCAGCTACTCGGAAGGCTGAAGCAGGAGAATCGCTTGAACCCGGGG +GGGCGGAAGTTGCAGTGAGCTGAGATCACACCACTGTACTCCAGTCTGGGCGACAGCGAG +ACTCTGTCTCAAGAAAAGAAAAAAAAATTGGCCTGGTGCGGTGGCTCATGTCTGTAATCC +TAGCACTTTGGGAGGCCGAGGAGGGTGGATTACCTGAGTTCAGGAGTTTGAGACCAGCCT +GGGCAACACGGTGAAACCCTGTCTCTACTAAAATACAAAAAAATTAGCCAGGTGTGACGG +CGTGCACCTATGATTCCAGCTACTCAGGAGGCTGAGACAGGAGAATCACTTGAACCTGGG +AGGCAGAGGTTGCAGTGAGCTGAGGTCGTGCCACTGCACTCCAGCCTGGCAAGACAAGAA +AGAAAGAAAGGAAGGAAGGAAGGAGAGAAAGAAAGAAAGAAGGAAAGAAAGAAAGAAGGA +AAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGAAAGA +AAGAAAGAGAAAATAAATTAAAACCAGGGAGATGGTTTGTTTTTGTAGCAAATGCTACAC +ACATATCACAAGAAATAAGGACCAATTGAGGACCAGCTCTCAGGAGCCTGCTGGCAGCTG +GTAGCAATCCATATCGCTTTATAAAGTCTACAGTAGGAAGTTTTGTGAATAAGGAAGCAT +ATTTTTGTTCAAATGAAACCACATCTCCAACAAAGGCACGTGAGAACCACAGATCTAGCC +CAACAGCTAGTGAGGAAGGAAACTCGGCCCCTGGGGACACTGATCACTTCTCACTCTCAC +CCCCTTCATCTTCCCAGGTTCTTTCTTTTTTCTTTTTTTCTTTTCTTTTTGAGACAGTCT +TGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGCCATCTTGGCTCACTGCAACCTCCACCT +CCTGGGTTCAAGCAACTGTCCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGCATGCA +CCACCACGCCCAGCTCATTTTTGTATTTTCAGTAGACATGGGGTTTCACCATGTTGGCCA +GGCTGGTCTCGAACTCCTGACTTCAGGTGATCCGCCCACCTTGGCCTCCCAAATTGCTGG +GATTATGGGCGTGAGCCACCGTGCCTGGCCTCATCTTCCCAGTTTGTATGTGGAGCCTGT +GGCTTGGGGTATTCTTTTAATTCTCTGTGACCAGGTAAGACACAGGCAGAAGATATCTGA +GCTCTGAAAACATCCAAGGCTAATATTGAGTGGGCAAGAGTTTGAGGCCTGTCACGTCAG +AAACGAGACCAAGATTCCACAGCTGACCTGTGCTCACAGCTGAATTGTGCTGAGCTGAAA +TACTGCGCCCGTTTCTTTCCATTCAACTTGTCTTGGTTTGACCTAGAACCACACTGCACA +GGAGAAGCACCATTTTTTGTTCAGACTCTCATCTGAAGCTGGAGCTTCTGCTAAGCACTT +GTTTGCATGGGAGTGGAAGGGGACATGTGCACCCACAGTTGTGGCGAAAAGATCCTTGGG +TGTGACAAAGGAGGAGGCGGGCCAAGGAGACCCATCCACTGTGTCCCTGGACCCTCCCAA +GGAATCCCAGGAACTGCGAAGCATAAACCACATCTTCACTGTCTTAGAGACGCTGCTGTC +CTTCCTTCATTTTACTCATGCTAAAGGCTCTATTTTTCTTTTCTCTAGAACTTTCTTTCT +TTCCTTTTTTCTGAGACGGAGTTTCACTCTCACCCAGGCTGGAGTGCAATGGCGCAGTCT +CGGCTCACAGCAAACTCTGCCTCCTGGGTTCAAGCGATTCTCCTGTCTCAGCCTCCCAAG +TAGCTGGGATTACAGGCGTGCGTGGTGGCGCCTAATTTTTGTATTTTTAGTAAAGACAGG +GTTTCACCATGTTGGCTAGACTGGTCTCAAACTCCTGACCTCAGGTGATCTGCCTGCCTC +CGCTTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACTAGACCCAGCCAGGTCTTTGTTT +CTTAACACAGAATATTGTTTTTCTTTTGGATTATGATTATTATTCTTTGAAGCCAGGGTC +TCGCTCTGTCACCCAGGCCGGAGTGCAGTGGTGCAATCATGGCTCACTCCAGCCTTTATC +TCCTGGGCCCAAGTGATCCTCCAACCTCAGCCTCCCAAGTAGCTGGGATTATAAGTGCGT +GCTACGATGTCTGGCTAATTTTTTATTTATAAATATTTTTTGTAGAGACAGGGTCTCGCT +TTGTTGCCCAGGCTGGTCTCAAATTCCTGGACTCAGGCGATCCTCCTGCTTCAGCCTCCC +AAAGTGCTGAGATTACAGGCGTGAACCTTTCAACTTTTAATGCTTTCAGTATTTTCCCAT +CCCTTGATTGAACATTTGGGTTTTAAATTATTTTTGTTGTTGTTGTTTCTTTTTGAGACA +GAGTCTTGCTCTGTCACCCAGGCTAGAATGCAGGGGTGTGATCTCGGCTCACTGCAACCT +CTGCCTCCTGCGTTCAAGCGATTCTTGTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGG +CGCCTGCCATGATGCCCAACTAATTTTTTGTATTTTTAGTAGAGACAGTGTTTCACCATG +TTGGCCAGGCTGGTCTCAAACTCCTGACCTCAAGTGATCCGCCCACCTTGGCCTCCCAAA +TTGCTGGGATTACAGGTGTGAGCCACTACACCCGGCCTAAGCTTTTTTTTTTTTAATCTT +AACCTGTTAACATTTTTCCTCTAATTAATGCTGGTTTTCTTTTATTGAGGAGTGAGGAGA +AGCAAGAATGGGGTCAACCCCATTGAAGAGGGATTTTTTTTCCAGTATACACTGTCATAG +TAATGTACCTATATTGTAAAACATTTAGAAATGACAGAAAAGTCCAAAAAAGCAGTAGTA +TATGTCCAAAAATGAAAACACTGCTCTATTTGTGAGTCAAGTAATAATTCCAAATTTATA +TTCAAAATGTTTTACTCATTTCAAATTCAGGTTCTCATTCAACTATAAATAAAATAATAT +TCTGTCCAAAAGTATGTGTATTTAATAACATCTTAGTCCCTATTATGTACTGAATTAGAA +GGCTCCCTCTCTCTCTCTCTTTTTTTTTTTTTTTTTTTGAGACAACGTCTCTCTCTGTCA +CCCAGGCCGGAGTGCAGTGGTACCATTACAGCTCACTGCAGCCTCAACCTCCTGGGCTTA +AGCGATCCTCCCACCTCAGCCTCCTGAGTAGCTAGGATCACAGGCATGCACCACCATTTT +TTATATGTTTTGCAGAGATGAAGTCTCGCCATGTTGCCCAGGCTGGTCTTGAACTCCAGG +GTTCAAGCAATTTGCCTGCCTCGGCCTCCCAAGGTGTTGGAGTTACAGTCGTGAGCCCGC +ACACCCTGCCAAGGCTTGTTTTCTAGATATTTGAGTAAAATAATGGTTCTGCAAATGAGG +CTCCACTGAGGTTAATTCACGCCCTGGTCTTTATTTATTTATTTATTTGATAAAACAAAA +GAAAGGTGTCAAATGATAACCTGCTAGATACTTGGTTCTTTTTTTTTGTTTTTTTGTTTT +TGTTTTTGTTTTTGTTTTTTTTTGACACAGAATCTCACTCTGTAGCCCAAGGTGGAGTGC +AGTGGTGCGATCTTGGCTCACTGCAACCTCCACCTCCCGGGCTCAAGCAATTCTCATGCC +TCAGCCTCCCAAGTAGCTGGGACTACAGGCGCACACGAACATGCCCAGCTAATTTTTTGT +ATTTTAGTAGAGACAGGGTTTTACTATGTTGGCCAGGATGGTCTTGAACTCCTGAGCTCA +GGCGATCTGTCCGCCTCAGCCTCCCAAAGTGCTGGGATTACAAGCGTGATCCACCGTGCG +CAGCCTTGTTTGTTTTTTTGAGACAGGGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTG +GCGCCATCTCAGCTCACTGCAGCCTCAGCCTCCCAGGTCCAAGCAATTCTCCTGCCTCAG +CCTCCCTGGTAGCTGGGATTACAGGCACGCACAGCCACGCCTGGCTAATTTTTGTATTTT +TAGGAGAGACGGGGTTTCACCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCAAGTG +ATCCGCCTGCCTCGGCCTCCCAAATTGCTGGGATTACAGGCGTGAGCTACCACGCTTGGC +CGATACTTGATTCTAAAAGCATCTTGGTACCCACCAGAATCTTCCATGGGTTCAGTTTTC +ACATTGATGGGGCCGCAGCTGCAAGGAGAAGGGAACCCTGGTCAGATGGGCAGGGTGAGG +ACCAGGCACAGCCGCCTGGACACGATGAGCTCAAATGCCCTGGATCTCCGCAGCACCAAA +TCCCCCTCCTCCCCTCAATCAAATGCAACAATGCCTCCATTTTAACATTAATGTCTTAAT +AAGTTGTTCCCAAATTAAACGTGTCTACCGAAAGTAGTCTTCTAATTCCAAAGGTCCTTT +TGGACAAAGAATAGGATAGAAAATAAGGAAGGGAAGAAGCACATTAACCCTTTACACTCC +ACTTAAATGCTGTAAGGAGGCCTTTCTGTCATCCAAAAACGAACGCTGTGCATAGTTGTG +GATTTTGGTTGCTGTGATTTATCTTTTACCTTTCACTTGGTGATACTATGGATCTCTCCG +C diff --git a/paraphase/data/ncf1/ref.fa.fai b/paraphase/data/ncf1/ref.fa.fai index 237e259..eff27d4 100644 --- a/paraphase/data/ncf1/ref.fa.fai +++ b/paraphase/data/ncf1/ref.fa.fai @@ -1 +1 @@ -chr7_74768800_74792800 24001 24 60 61 +chr7_74760000_74820000 60001 24 60 61 diff --git a/paraphase/data/neb/neb_config.yaml b/paraphase/data/neb/neb_config.yaml index ed67f38..1e32e8f 100644 --- a/paraphase/data/neb/neb_config.yaml +++ b/paraphase/data/neb/neb_config.yaml @@ -18,4 +18,4 @@ coordinates: left_boundary: 151578800 right_boundary: 151588500 - noisy_region: [[151584195, 151584196], [151578903, 151578903], [151579992, 151580022]] + noisy_region: [[151579992, 151580022]] diff --git a/paraphase/data/pms2/pms2_config.yaml b/paraphase/data/pms2/pms2_config.yaml index e52556c..cc55367 100755 --- a/paraphase/data/pms2/pms2_config.yaml +++ b/paraphase/data/pms2/pms2_config.yaml @@ -10,7 +10,7 @@ data: coordinates: hg38: nchr: "chr7" - nchr_old: "chr7_5967000_5992500" + nchr_old: "chr7_5957000_6010000" nchr_length: 159345973 extract_region1: "chr7:5970000-5989062" extract_region2: "chr7:6735630-6754792" diff --git a/paraphase/data/pms2/pms2_ref.fa b/paraphase/data/pms2/pms2_ref.fa index 7dd6516..f365893 100644 --- a/paraphase/data/pms2/pms2_ref.fa +++ b/paraphase/data/pms2/pms2_ref.fa @@ -1,427 +1,885 @@ ->chr7_5967000_5992500 -CTCTTGCCTAGTGGTGTTGCCATCTTGTTTGGAAAAGTCTAGATTATCAGAGAGAGATGA -GGGAGAGCGGGCAGACTTCTCCCCTTTTTTGTCTGCTTTTTTCTTTTCTTTCACCATTGC -CTTGGGAAGATCCAATGGTTACTTGAATCAAATGATTTCTTTGGTTCAGAGCTGCTTGTT -TCAAAGCACTGATGAGTTTTATCTGAAAAATAAAAATTACGTCTCCAAACACTTGGGGTT -TTCATTTGTAGTTAAAATTTCAGTTTTACAACACAATGTCATTATCATTCTCCTGACAAA -GTCTGAAAAATTAGTTACCAGGGCCGGGTGTGGTGGCTCACACCTGCGATCTCAGCACGT -TGAAGGGCCAAGGTGGGAGGATCATGTGAGTCCAGGAGAGGGAGATCAGCCTAGGCCACG -TAGTGAGATGCCACCTCTCTACAAAAAATAAAAATAAATTAGCCAGGCGTGGTGGCACAT -GCCTGTAGTCCCAGCTACTAGGGAGGCTCAGGTGGGAGGACTGCTTGAGCCTGGGAGGTC -GAGGCTGCAGTGAGTAGTGTCACACCACTGCACTCCAGTCTGGGTATCAGAGCAAGACTC -TGTCTCAAAAATGACTATAATTACAAGTTTCAAGTACCATCAGTTTATAAAAATACAACC -TCAACATCGCATTGCTTGTTCCTAAAATTTTTTTATTTTTAATTTTTGAGACAGAGTCTC -ACTCTGTCACCCAGGCTGGAGGGCAGTGGCACAATCACAGCTCACTCTAGCCTCAACCTC -CTAGGCTCTGACGATCCTTCCATCTCAGCCTCCCAAGTAGCTGGGACCACAGGCATGCAT -TACCACACCTGGCTAATTTTTTGTAGAGACAGGGTCTTGCTATCTTGCCCCGGCTGGTCT -GGAACTCCTGAGCTCAAGCAATCCGCCTGTCTCAGCCTCCCAAAGTGCTGGGATTATAGG -TGTGAGCCACTGTACCTTGCCCCAAAAATTATTTAAGTTGGAACCATTGTCTAGCATTGT -TTCTTGAAAGGTAACCCTACACATGAAATAGGCTACTTCACCTCTCAGGTCTTGCATGCA -GCCAATTCACACTTTAAAAGCCCCTCTCTGGCCGGATGCAGTGGCTCACACCTGTAGTCC -CAGCACTTTGGGAGGCCAAGGCAGGTGGATCACGAGGTCAGGAGATTGAGACCACCCTGG -CTAACACTGTGAAACCCCGTCTCTACTAAAAATACAAAAAATTAGCCAGGCATGGTGGCA -CATGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCACTTGAACCCAGGAG -GTGGAGGTTGCAGTGAGCCGAGATCACACCACTGCACTCTAGCCTCGGCAACAGAGCAAG -ATTCTGTCTCAAAAAAAACAAAACAAAACAAAAGCCCCTCTCCTTATAGGTCAGCATTGT -AAAGTGTGCAAGAGCTGGATTCGGAGTCCTGCATTGCCCATTACCAGTTCTATGGGTTTG -TTTATTTATTTATTTATTTATTTTTGAGACGGAGTCTCACTCTCTTGCCCAGGCTGGAGT -GCGGTGGTGCGATCTTGGCTCACTGCAAGCTCCACCTCCCGGGTTCATGCCATTCTCCTG -CCTCAGCCTCCTGAGTAGCTAGGACTACAGGCGCCCACCACCACACCTGGCTAATTCTTT -TTGTATTTTTAGTAGAGACGGGGTTTCACCGGGTTAGCCAGGATGGTCTCAATCTCCTGA -CCTCGTGATCTGCCCGCCTTGGCCTCCAAAGTGCTGGGATTACAGGCGTGAGTCACCGGG -TGTGGGTGCCCGGCCCAGTTCTGTGTTTTTTGGGTTTGTTTTTTTTTTTTTTTTTAGACA -GACTCTCTAGCCCTGTCCTGCAGGTTGGAATGCAGTGGCAGGATCTTGGCTCACTGGCTC -ACTGCAACCTCACTGCAGGTTCAAGTGATTCTCCTGCCTCAGCCTCTCGAGTAGCTGGGA -TTACAGGCACCTGCCTCCATACTCAGCTAATTTTTGTATTTTTAGTAGAGATGGGGTTTC -ACTGTGTTGGCCAGGCTGGTGTCGAACTCCTGACCTCGTGATCTGCCCGCCTTGGCCTCC -CAAAGTGCTGGGATAACAAGTGTGAGCCACCGTGCCTGGCTGGTTTCCTTTTTTTTTTTT -TTTTTTTTTTTTTTTTTTGAGACGGGGTGTTGTACATTTTGCCCAGGCTGGTTTCAAACT -CCTGGCCTCAAGCAATCTTCCCACCTTCTCCTCCCAAAGTGCTAGGATTGCGGGCATGAG -CCACTGAGCTCGGCCAAGTGCTGTGTTCTGAAGCAAGCTGCTTAATCTCCTCTGCCTCAC -AAATAGAAATAACAGAACCTTGTCTCATAAGAATTAAACCGATGACACACAGAAAAATCC -CTAAGTACAGGATACAGAGCAAAGTCAATAAATTGAGTGATTATCTCGTCCCTTTCCTGT -TTTCAAACTTGAAATCATTGGTTTCCCACTCCCTCTAGCACTGCCATCGATTGAGTGCCT -CTCATATGCCGGACAAGCAAGGACCGGTGTGCTGGAGTTGCGTTTCCAGCGCATGGTTGC -TTGAGCTGTATTTCCAGCGCATCGTTGCTCGAGCTCCGTTTCCAGCGCATATCTTTGCTT -GTCTGGCATATGAGCTGCGGTGCAGGGTTTCAAAGCCATAGTTTTCATGGCTTTCCTAAT -CTGGCCCCGCTGAAAGCACCCTGGTCCATCAGGCAGGATGCATAGGTGAGCCCTGTGGTG -AAGGCCAGGTCTGGTCCCTTTTCGTAGGCCCCGACGGGTGCAGTGGGCACTTCTTGCCCT -CTTCTTCCTGGATGCCATCCTCTGGACACCCCACCCTCCAGCTGAACCCATCTCCAGCCT -TCTCTCTTCCTCCATTATTTATTTATTGAGACAGGGTCTCGCTCTGTCACCCAGGCTGGA -GTGCAGTGGCACAGTCTTGGCTCACTGCAACCTTCCGGGTTCAAGTGATTCTTCTGCCCT -AGCCTCCCAAGTAGTTGGGATTACAGGTGCCTGCAACCACTCCCGGCTAATTTTTGTATT -TTTAGTAGAGCCAGGGTTTCACCATGTTGCCCAGGCTGGTCTCAAACTCCTAACCTCAGG -TGATCCGCCCGCCTCGGCCTCCCAAAAGTGCTGGGGTTACAGGCGTGAGCCACCGCGCCC -GGCCAAGCCTTCTCGCTTCCTTCCAACACCCTTGCTCCTTCCCGCCCCCGACTACTGTCT -CAGCGAAGCCGCCCCTGGGTCCCCTAGCCCAAGGTGCTCTCACCTCTAAATTTAGAGGGG -CCTTTACTACGAGCTTTTCGGTCTTCTGTCAGTGATCTACAAATAAGTGAACTACAAATC -AAGCCAATTTCGTTTCTCAGTGCGTTTCCTAATGTTTCCTCTGTTCTCCTGGGCTTAAGG -AGAGGCCATCTCTCTCCTGTGTCTACGGTGAGCCGGGAAGAATCGGCTCCCTGCACTGGT -CTGCCCGGCCTAGGCCCTCCTCGCCCATCACGCACGTGCTCGGGTCCTGGGAGGCCGCGT -CAGTCCGGCCGGGAAGGAGCAGGACCCAGTCGCCATGGCTGTCCCGGCGTACGCAGGACC -GCGGCCTGGGGCGCTCACCTCGCTCCAGGAGCCCAGAGACCTCGCCGGGCTCGGGCTGAG -GTGTTGCCGGGCTCTCGGCGTCCCAGACCCGGCTCCGGTCTCCAGGCAACCGCGGACGCC -GCCAGGCCCACCCTGTGCTCTTAAAGGGGCCGCGCGCCAGCGCCAAGCAGGTGTCCCGCC -CTTGCTGGTCCTGAAGGCCGGGGGAAAGGCTGGACGCTGGAGGCAGCAGGCCAGGGTTTT -CCCAGCTCTGCTAACTGCTTCATCATAAAATAGGAATAACGCAGGCATTAGTTTTCCATT -GCTGCCGCAAACAAATTACCATAAATTTAGTGGTTCGAAGCAACACAAATTTATTACCCT -ACAGTATGTAAATTAGTCCCACAGTGCTGGTTCCTTCCAGAGGCTGAGGGAGAGAATGCG -TTTTCTTGCCTTTTCCAGCTTTTCCAGAAGCGGTCCCCAACCTTTTTGGCACCAGAGACC -GGTTTCGCGGAACACAATTTTTCCATGGATTGGGGTCGGGGAGGGATGGTTTCAGGACGA -TTCAAGTGCATTGCATTTATTGTGCACTTTATTTCTACTATTATTACATTGTAACATATA -ATTAAATAATTCTACAACTCACCATCACAGAGACTCAGTGGGAGCCCTGAGCTTGTTTTC -CTGCAACTAGACAGCCCCATCTGGGGGTGACGGGAGACAGTGACAGATCATCAGGCATCA -GATTCTCATAAGGAGCGTGCAACCTACATCCCTCGTGTGTGCAGTTCACAATAGGGCTCG -TGCTGCTATGAGAATCTAATGCCCACCGCTGATGTGACAGGAGGCGGAGCTCGGGTGGTA -ACGCCAGCGACGGGGAGTGGCTATAAATACAGATGAAGCTTCGCTGGCTTGCCGGCCCCT -AACCTGCTGTGCACCCCACTTCCTAATAGGCCATGGACCACTACTGGTCTGTGTCCGGAG -TGTTGGAATCCCTGTTCTAGAGACTGCTTGCAATCCTTGACTAGTGGTACCTCCTTCCAT -CTCCAAAACCAGCAAGACAGCCTCTCTCTGGCCAGCAGGGAAAGGTCTCCACCTTTGAAG -GACTCACCCAATGGACTGGGCCCACCCAGACAATCCAGGATAATCTCTCTGTTGCAAGAT -CCTTAACTCAGCCAGGCATGATGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAG -GCGGTCGGATCACCTGAGGTCAGGAGTTCGAGACCAGCCTGGTCAACATGGTGAAACCCT -GTCTCTACTAAAAATACAAAAATTAGCCAGTATGGTTCTGGACACCTGTAATCCCAGCTA -CTCGGGAGGCTGAGGTGGGAGAATCACTTGAACCTGGGAGGCAGAGGCTGCAGTGAGCTG -AGATCATGCTATTGAACTCCAGCCTGGGCAACAAGAGCGAAACTTCATCTCAAAGAAAAA -AAAAAAAAAGATCCTTCACTCAATCACACCTGCCGAGTCCCTTCTGCCACGTGAGGCAGC -GTGGTCACAGGTTCTGGGGATTAGGACACAGCTGTCTTGGGGGCTGTTATCCTGCCACAG -CTCCCAATCTGGAGAGTTCATAAGTGGGATCCTGCAGACCACGCCAGCACAGTGCCAGAC -ACGATGGCACAGTGACTACTGTACTGCCTCCTCCATCTGAGGGATTCTAAAGCAGGAAGG -GGAGCCGCCCACAGTCTGGAGAAGGGGTGGGGGCAGCAGGGGGAGCCACATCTGTCATCT -CTGGGCCCCCAAGAGGGCATCTTTACTTCCATTTTCAGCCAAGTTCAAACAGGACAAGGT -TCCATGAAAACTATTTGAAAAGACAGACAGGGATTCTTATATTCCCAGAACCATTCAAGG -CCAGTAACTGGAATGTTCTACAGTTCACATCCTGAGGAAACCAAATCACAGCATCAAATT -ATGGGAAATCAAACTCTTTTTGTTCCCCTGCGAGGACAGCATTTTGCGACCTTGGCCGCA -CAGAGGAATGTTTCAAATAGTGACCCCTGTCCCATCCAGTCATTTTCTTCCAGCCGGGCA -GAGAATCCCCCGTGTTTAAAAATTTAATGTGAATCAGGGCTGAGAATCACTAACTGAAAA -GGACCCTACTTTTAAATTTATGAAATTAAACAAAGATGAATTTAATTATCATTAAGGGTT -GAAAGTTATAGACTAAACTATGTCCAGCCAGAGCAGAGGCCTGAGTAACTTCCAAAGTGG -TTTGGTTTTTTTTTTTTTGTTTTGTTTTGTTTTGTTTTTTGAGACACAGTCTTGTTCTAT -CTCACCCAGGCTGGAGCGCAGTGGCGCAATCTCGGTTCACTGCAACCTCCGTCTCCCGGG -TTCAAGCGATTCTCCTGCCTCAGCCTCCTGGGTAGCGGGGATTACAGGCATGCGCCAGCA -CACCTGGCTAATTTTGTATTTTTAGTAGAGGCAGGGTTTCTCCATGTTGGTCAGGCTGGT -CTCGAACTTCTGATCTCAGGTGATCCGCCGGCCTCGGCCTCCCAAAGTGCTGCGATCACA -GGCATGAGCCACCATGCCCAGCCCAAGTGTTCTTATTTTTATAAAATGTGTTCTTGCCTG -GACACACACACACGAGCGCATGCAAACATAGAGAAAAAAAATTTGCAAGCAATGCTCCAT -CTGGTTTGAAAAGGTTCTCAAGATCACTTTTAAATGGGTGTGATGTGTATTTTTTTTAAG -TAGCAGGTTCATTTTAAAACAAAAAAGGTTAGTGAAGACTCTGTCTTTCAAAACATAAAA -ATCTGCGATAAAACCAATTATTCCATACAGTGACTACGGTCAGTTCTGAGAAATGACACC -CAGGTTGGCGATGTGTCTCATGGTTGGCCTTCCATGGGGACAGTTCCAGGGGTGGTCCAT -CTCCCCCATGTGGGTGATCAGTTTCTTCATCTCGCTTGTGTTAAGAGCAGTCCCAATCAT -CACCTGAGTGTGAGACACAATGGTTCAACGTTTTAGTAGTTTTTTGACGTCAGAATGGCA -GCTCTTCAGAAGCATTCTTCTCTAAAATAAGGCTGGACAAGATTACAGCTCAAAAACTAC -CTTCCCTGAAAAACCTTCCCCCAGAGAAGCCTAGGTTCTAGATCTCAGCCCTCCACCCTT -CTGTGAAATCAGGCTCCTTGTGGCTCCTTCAAGGTGGCACCGCCTCCACTCCAGACGCCG -ACCACACCTGTCTCAGCAGCCACCCTGCCCTCTCACCCTGGCAGGTGCAGCAGCCTCCCA -GCAGGCCTCCCTGCCCCACTGCGACCCCTCCGAGCCGCTCTCCACTCAGCAGCCAGTGAT -TACTTTTAAAGGGCTGTCAGGTTATTCATTCCACTTCACAGCTCTCCCCCTCACCTGAAT -AAAAGCCCCCGTCTGTCCCCTGACTTGGCCCTCGCTGGGCTGTGCCTGCACCCCCACCTC -CAAGCACGAATGCCTCCCTTCCTCACCCCAGCTGCACTGCTACTCCCTTCCTCTTGCACA -GGCCCATCACGCAAACACCTGCCTTGGGACTGTGGCACTCCCGGGACCCTCTCCCCCAAT -GGGTGCAGGCGTCACTCCCCCTCTGTCGAGCTCCGACCTGCTGCCCATAGCACTCCAGCC -CTGGCCCTGCTGCCTCCCTGCCATGGGTCCTCTGACAGGAAGGAGAGGACACAAGCCTGA -AGCCCAATGTCACCTTCTTTCTTCCTGCAGCACCCTGAGGGCTCGCCATGTGCCAAGCAC -AGTCAGAAGGCTGGGGTGACAGCAGGTTGGAGAAGGACAGACAATCAACAAGTCAACAGA -GAACCAAGACAGGTGGCACCAGGCGAGGCGGCCTGCTCAGGTGTGGGGATGGGGTGAAGG -GTGACGGTGGCAAACCCAGGTAGAGAGGAGAGTAGGGAGAAAGGGTGTAAGGCAGGGAGG -AGACTGAGGCGAGCGTGGAACTGGAAGGCAGCTACATGGCTGGAAGCTACATGGTGGGGA -GATGGGGCTGGAAGGGTGGGCAGGGCTCAAAGCAGGAGCCTCCTGGGCAGGCAGTGACAA -CACCGGAGATGGACGGGTAGGCCAGGGCGAGAGGGAAGGAGCAGCCTGTGGTTCCCCGGG -CCACTGAGTCACACTAAACTCAGGACATCAAAACTGCCCGGCTATGAGCTCAGCTCCACG -CTCTCACTCACAGACTCCAAGACTGGAAGATCCATATTATGTCTTTTATTTTGGTGAGGT -CAGGGGTGGTGGAGAGACTCTGTCTCCCAGGCTGGAATGCAATGGTGCGATCTCAGCTCA -CTGCAACTCCGCCTCCCAGATTCAAGCAATTCTCCCGCTTCAGCCTCCCGAGTAGCTGGG -ATTACAGGCGCCCACCACCATGCCCAGCTAATTTTCGTACTTTTAGTAGGGATGGGGTTT -CACCATGTTGGCCAAGCTGGTCTCAAATTCCTGACCTCAGGTGATCAACCCACCTCCGCC -TTCCAAAGTGCTGGGATTACAGGTGTGAGCCACCACGCCCAGCCCCTATTAGGTCTTTAT -CCAAGAAACACTGTGGCTAGAAGTCAGACTCTGGGCCCTCTTCTAATTAAACTCTGCCCT -TGAGTCATTTCATCTAATCTCATGGCTGTAAATTACACCTGAAGCTCACACAGCAGGCTC -CATCCCACCCACTCCCCACGTGGCCCCCAGCTGCTGCTCTCCTCAGCGGCCGCAGCCACC -GCACCCCTTCCAGTCTGTTCTCTCTCCAGCAGCTGCAATCACGGGACTCCTTCCCGTCTG -TTCTCTCCAGTGGCTCGTGCCACACACAGCACAGACCCCCAGGGTCTAGGTATGACCGGC -AACACTCTACGTGGCTGTCCTCTGGACGCCGCTCTGCTCACTCCCTTCCCCTCTCCAGGG -ACACAATCAGCCTCTGGCTTCAGTCTTGCTACTTCCTTCGCTTGGAAAGTTCTTACCCAA -GAGGGCTCCATTCTACCTTTTTTTTTTTTTTTTTTGAGACAAGGTCTTACTCTGTCACCC -AGGCTGGAGTGCAGTTGCGTGATGTTGGCTCATTGTAACCTCGACCTCCCTGGCTCAAGT -GATCCTCCCACCTCAGCCTCCTGAGTAGCTGTGACTACAGGCACATGCCACCACACCTGG -CTAATCTTTTAATTTTTTGTACACATGGGGTCTGCCTGTGTTGCCCAGGCTGGTCTCTTA -ACTCCTGGCCTCAAGCAATCCTCCTGCCTTGGCCTCCCAAAATGCTGGGATTACACGTGT -GAGCCACCATGCCTGGCTTCCATCCCACCTTTTAGATGGCAGCTGAGATGCCACCTGCCC -AGATGCCATTCCCTGACCACCATCTCACCTGGTCACCATGTTTTTCTCTTGTCATTTCCT -GCCCCAAAACGCTGTTTTAGGCCAGGTGCGGTGGCTCACGCCTGTAATCCCAGCACTTTG -GGAGACCAAGGCGGGCAGATCATGAGGTCAGGAGATCAACACCAGCCTGACCAACATGGT -GAAACCCCATCTCTATTAAAAATATAAAAATTAGCCAGGTGTGGTGGGTGCCTGTAGTCC -CAGCTACTTGGGAGGCTGAGGCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCAGT -GAGCTGAGATCACATCACTGCACTCCAGCCTAGTAACAGAGCGAGACTCCGTCTCAAAAA -CAGACAAAGAAAAATGCTGTTTGAATCTCTTGACTGTGCTTACTGGCATCTAATGCGTGT -CATTTATTTGTGGTGATGCCTATTTCTCCCCACTGTCTGCTCCACAGGGGCAGGGGCTGC -AGCCGCCTTGTTACCTCTGTGTCCCGAGCACCTGGAGCAGGGCGGGCCCCACATCAGGGG -CTCAAGGAGCACCTGCTGAATAAATAAAGGAATGGCGTCCTGGCCCTTCCCAGTGGCCAG -CTGATACACAGTCACTTTTCTTGGACATCAGGCTAATCCCCACTGCAGGCAGAACCACTG -CTGCCACCTTCCCACACCAACCGAAGCAGCGGCAGTGACGCCACGTGCAATGACAACCAC -GGCACCCCGTGAAGCACCTGCTGCCTCGATGACTCTGCAGAATCGTGTCCAATGTCGCCG -AGTCCTGGCAGCAGCAAATCTTTATCTCCCAATGTTGTTATGACCCATAAGGTCCATAGA -CGAACAAGGTACCTCAAACGCTAACTGCGTTGGAGTCAACCAAAGCTCGGAGATAGAATA -CTGGCCGGGCCAGGCACAGTGGCTCATGCCTGTAATTCCAGCACTTTGGGAGGCTGAGAC -AAGGGGCAAAAGGAGACCATGTTTCTACAAAAAATTTAAAAATTAGCTGGGCATGGTGGT -GCATGCCTGTGGTCACAACTACTTGGGAGACAGAGAGAGGAGGATCGCTTCAGCCTGGTA -CGTCAAGGCTGCAGTGAGCTGTGATTGTGCCACTGCACTCCAGCCTGGGGGACAGAGGGA -GAATCTGTCTAAAAAAAAAAAAAAGAAGAATTCTGGGTTTTTTTTGTTTTTTTGAGACGG -AGTCTCGCTCTGTCGCCCAGGTTGGAGTGCAGTGGTATGAACTTGGCTCACTGCAAGTTC -CGCCTTCTGGGTTCACGCCATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGACTATAGGC -GCCCGACACCACGCCCGGCTAATTTTTTTGTATTTTTAGTAGAGACGGGCTTTCACCATG -TTAGCCAGGATGGTCTCGATCTCCTGAACTCGTGATCCGCCCGCCTCAGCTTCCCAAAGT -GCTGGGATTAGAGGCTTGAGCCACCATGCCCGGCCAAGAATACTGCTTAACAGAGGTAAC -AAAAGAGCAATAATTATGAGTTCAAGGTCACAGAGAACGCAGACGACACAGATGCTCAGC -TACGACGCTGCACGTAGCTCTCTGTGTAAAATGACCCCTGGCAATCACAAAGGCGTTTAC -AACCTTGACCAAATCAGGAGCTGGGCTGAGACCTTCCTCGACTGCAAGCTTGAGCAGCTG -AGCTGACAGCCAGGCTTTCTTTACTTACCGACTTCCGGCAGGCTCTGGAGGCAAACATCT -GCTTGACTCGGGAAGGCCGGCACATGACCCCAGGGCTGTCGCTCAGCATGAAGATCAGTT -CATCGACGTCCTGGGGTCCGAAGGTCCAGTTTTTACTAGTTGGCAAGGAAATCAGTTTAG -CCCTTTCAGTGACTGGAGCTAAAAGAATACAATTTTGAGAAAAATCCATGACTTGACAAA -CACGTTTCACTTGAAAGCTACTTAGGATGAACATCTGAGGCCGGGCGTGGTGGCTCACGC -CTGTAATCCCTGCACTTTGGGAGGCTGAGGCCAGCGGATCATGAGGTCAGGAGATACAGA -CCATCCTGGCTAACATGGTGAAACCCCGTCTCTACTAAAAAATAGAAAAAATTAGCTGGG -TGTGGTGGCAGGCACCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGTGTG -AACCTGGGAGGCGGAGCTTGCAGTGAGCCGAGATCGGCACCACTGCGCTCCAGCCTGGGC -GACAGAGCAAGACTCCATCTCAGAAAAAAAAAAAGTGAACACCTGAAAGAGAGGAAACTC -ACAAAATGCTTTTTGGAGGAACTTTTTAATCTTTTATAAAATTAAAAAAAACTGGTCTAT -ATGACCTGAAAGATTATTCCCAGCTCTAAAAAGACAAGAATCTATAGTTCTGATTTTTTT -TTTTTTTTGAGACAGAGTTTCACTCTTGTTGCCCAGGCTGGAGTGCAGTGACGTGATCTC -GGCTCACTGCAACCTCCACCTCCCGGGTTCAAGCGATTCTCCCACCTCAGCCTCCTGAGT -AGCTGGGATTACAGGCACCCGCCACCACGCCCGGCTACTTTTTGTATTTTCAGTAGAGAT -GGGGTTTCACCATGTTAGCCAGGCTGGTCTCAAACTCCTGACCTCAGGCGATCTGCCCGC -CTTGGCCTCCCAGAGTGCTGGGATTACAGACGTGAGCCACCACACCCAGCCGCTATAGTT -CTAATTAATAACTTACCATTTTCATCGATAACAAAATCAAAGCCATTCTTTCTAAATATT -TCCAGATTTTCTATCAGAACAGCTTCATTAACAGCAGTTAAGTTGAGAGTCTGAGGTCTG -AAAAACACAAAAATGATTCAAACCATATCCTGAAGTCAAACATTTAGCTTTACAGCAGAA -ATGAAATGAAAACAACAATACTGTATTTTGAATTCATGTCAAAATAACAACACAAATAAC -AACACTACTCAGCTAAGTGTCACAAAACTTCCTGAGAAGTTCCTTTTAATTTTCTCTTTC -TTAAAGTTCTTTTTAGAAGTTAAAGTAGCTACAGGCCAGGTGCGGTGGCTCACGCCTGTA -ATCTCAGCACTTTAGGAGCCCGAGGCAGGCAGATCTCTTGAGGCCAGGAGTTTGAGACCG -GCCTGGTCAACACAGCGAAACACTCTCTCTACTAAAAATATAAAAATTAGGCCAGGCATG -GTGGCGCACGCCTGTAGTCCCAGCTACTTGGGAGGCTTAGGCATGAGATTCGTTTGAACC -CAGGAGGGAGGCAGAGGTTGTAGTGAGAGCCAAGATCACGCCACTGTACTCCAGCCTGGG -CGACACAACAAGACTCTGTCTCAAAAAAAAAAAAAAAAAAAAAACACCCATAAAAACAAA -AATTAGCTGGAAGTGGTGGCTCATGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCACT -AGAATTGCTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCAAGATCACACCACTGCACTC -CAGCCTGGGCAACAGGGCAAGACTCTGTCTCAAAAAAAAAAAAAAAGTTCAAGTAGCTAC -AAAAGTAGTTTGCTTTTTCCTCAGCCTGCCACGCCAATGACTCCCACTTTTTCTGAATCC -TTTCCTTAAGGATAACAGTATCACAAAAATGCTATTTTTCCTCCTTCTAATACAGAATTT -GAAACACTGGGTTAGGTCATTGCCAGCATTTGTAAACAGAATGAACAGACAGCTTTTATT -TTGCTATCCTGTTCCTTCCTCTGCCTGTATTATATCTCCATCCCTCTCTCCTCCTGGATT -TACTGTTTGTTTTTTTTTAACCTTTCGTTATTTTTTTCAAAGATAGAGACAGGGTCTCAC -TATGTTGCCCAGGCTGCTCTCAAACTCCTGGGCTCAAGCGATCCTTCCACTTCAGCCTCC -CAAAGTGCTGGGATTACGAGTGTGAGCCACTGCATCTGGTCCTGAGTGCTGGATAAGACA -AACACTGCTCAAGGCAGGAGACAGCTGGTGAGCAAACACAGGCTTGGTCCTGGAGCCAAC -AGATTACCGGGGAAGAAAGACGTTGAGCAAATACTCAGGCAAGTCGATTATGATGAGAAA -CGACAGGAAGGTCAGGAAGAAAAAGCAGCCAGTGTCATAGAGAGACTTCACCCTGGGGTC -AGGAAGTGACCTTTGAGCTGAGTCCGGGGATAAGAGAGTTAATCAGGTAACGGGGGAGAA -GTGGGTGCAGGGTGCAGGACAAGTATTCTAGACAGGGACAACAATCTGTGCCAAGCCCCA -GGATGGACCGCTGATGTTTGCAGAGCCACACATAAAGATATCCTTCATTCTGCTTAGTGG -CCACATAGGGATTCATCAGGCCTGCCAAGGGAAAAAGAAAGACAGCCAGAGAGGCTTGAG -TACAGGGAACAAGGGGAAGACGAACGGGAAAAGCTACAGAGGTCAACAGGGCCACCCTAC -ACAGGGGCTGGCAGGGCAGGGTGGAACTGGGTCTTTATCCTTTAATCTTGAAGTGTGGTC -CATCTGGGACCCTAAGTGGTCTGTGATTACCTGGGCCAACTTGAAATGTCACAGATGAGA -GGTTATCTTTGCCGAATGGCTAAAAAATACAAGACCTCAGCCGGGCATGGTGGCTCACAC -CTGTAATCCCAGCACTTTGGGAGGCTGAGGTTGGTGGATCACCTGAGGTCAGGAGTTCAA -GACCAGCCTGACAAACATGGCAAAACTCCCTATCTATTAAAAATCCAAAAATTAGCCAGG -TGTGGTGGCGGGTGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATCACTTG -AACCCGAGAGGCAGAGGTTGCAGTAAGCCGAGATCACATCACTGCACTCCAGTATGGGCG -AAAGAGTGAAACTCTGTCTCAAAAACACAAAAACAAAAAACCTCTATTAAGAGGAACAGG -GAAGGGATATAAAGTAGCTTACTAAATGTCTATTATTACCATTGCCTCCTACTGAGAATA -AAAACAATTCACGCATTCCACAGGAGAGTACTCAGCAAACTACACAGGAGAGTACTCAGC -AAACTACACAGGAGAGTACTCAGTAAACTACACAGGAGAGTACTCAGCAAACTACACAGG -TTCAGTGGTACATTTCTCCATGTGGGATCTACTTGTTGGGATCTGAGTTTACTTCACTAC -GTGGTTTAATTTCCCACACGAAAATCCATGACCTCTTCTTCTAACTTTGCTGAAGACAAG -ACTTTGGTTTTACATGATACTATCACACCTGACCTTTGTGAAGTAGTCAGGGTAAAACAT -TCCAGTTTGGCCGAGGAGAGAGAAATACCAAATTCTGCAGTGACTATCTTAAAATAATTT -TTAAATTTTATTTTATTTTATTTATTAATTTATTTGTGAGACAGAGTCTCACTGTCTCAC -TCTGTCACCCAGGCTGGAGAGCTGTGCAGTGGCACGATCATGGCAGCCTCAATCTCCTGG -GCTCAAACGATCCTCCCACCTCAGCCTCCCGAATAGCTGGGACCACAGGCACACACCATC -AAGTCTGACTAATTTTTTACATTTGTTGTAGAGACAAGGTTTCACCATGATGCCCAGGCT -GGTCTCAAACTCCTAAGCTCGAGGGATCTGCCTGCCTCAGCCTCCCAAAGCTCTGGGATT -ACAGGCGTGTGCCCCTGCATCCAACCTGCAGTGACTATCTGACTTCTGATTACTCTACTG -TCAATCAACACTGGCGCACAGGCTGTCTGTCTTTCTGAACACACACATTCCATACACTAT -GCATACTAATACTCCATACTATCAATTGCCCTCATCAGAAGGATCTTCTGGCTAACCAGT -GATCAACATTTTTAATAGCGAAAAATACCTGATACTTAGAGAACATGTTAACCACGTGAA -CTGGGGCAGGTTACTCAACCTCTCTGCATGTGCCTCAGTTTTATCGCTTGTGGAATGGTG -ATGGTAACAGTAACAACCCCATAGGTTTTTGAGGATTAAAGGAACTAATACACATACATT -ATTTCAACAGTGCCTGGCAGATTCTAGGCACTGAATAAATGGTAACTATCACTATTATGT -AAAAAGTATAAAAATCTGCTATATGAATACTTATGGAAAAATACATATATACATATAGAC -ACACATATAAACTATTAGGTCTCTTTTTTTTTTTGAGATAGAATCTCGCTCTGTCACCCA -GGCTGGAGTGCAGTGGTGCGATCTCGGCTCACTGCAACCTCTGTCTCCCAGGTTCAAGCG -ATTCTCCTACCTCAGTCTCCTGAGTAGCTGGAATTACAGGCGTGCACTGCCATGCCCAGC -TAATTTTTTGTATTTTTATTTTTTATCATTATTATTATTTTTTGAGACGGAGTTTCACTC -TTGTTGCCCAGGCTGGAGTGCGATGGCACGAACTCGGCTCGCTGCAAACTCCGCCTCCCG -GGTTCAAGCGATTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGACTACAGGCGCCCGCCAC -CACGCCTGGCTAATTTTGTATTTTTAGTAGAGACAGGTCTCACCATGTTGGTCAGGCTGG -TCTCGAACTCCCGACCTGAAGTGATCTGCCCACCTCGGCCTCCCAAAGTGCCGGGATTAT -AGGCGTGAGCCACCGTGCCTGGCCTTTTTGTATTTTTAGTAGAGGCGGGGTTTCACCACG -TTGGCCAGGCTGGTCTCCAACTCCTGACCTCAGGTGATCTGCCTGCCTCGGCCTCCCAAA -GTGCTGGGATTACAGGTGTGAGGCACCGCGCCTGGCCAACTAGATATTTTTTATTTTTTA -CACCCCTCCTTCCTAGATCTCTTCTTTTTTAAAGTAGATACAAGGTCTTGCTGTGTTGTC -CGGGCTGGTCTCAAACTCCTGGCCTCTTGTGATCCTCCTGCCTTGGCCTCTATTAGATCT -TCAATTTGAGGGGGAGTCTGGGAATGAACACTAAACACACTCACGCTATGAGCCTCTGCC -CCTGGAGCACGGTGTGCTGCTGCAGCATCTCGAAGTTATACTTCTCGTCCGTGGCATGCT -GGTCCACTATGAAGATATCCTCATTCAGTTTGGTTATTATAAATCCCAGGTTAAACTGAC -CAATGATTTCCATTTCTGCAAACATCGTTTTACTGCAGGTAGAAAATGTTAATTATCAGA -CATTTTACAAGATTATTTTTCTGATTATGTTATAGAACACTGTAATAAAAAAAAAGTCAA -ACAATACAAAAACAAAATAAAGTCCCTAGCCATCCCGCTTTCTTTTTTTTTGAAACAGAG -TCTCGTTCTGTCACCCAGGCTACAGTGCAATGGCACAATCTTGGCTCACTGCAACCTCCA -CCTCCCGGGTTCGAGTGATTCTTCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGTGC -GCCACCATGCCCAGCTAATTTTTGTATTTTTAGTAGAGACAGAGTTCCACCATGTTGGTC -AGGCTGGTCTCGAACTCCTGACCTCATGATCTGCCCGCCTTGGCCTCCCAAAGTGCTGGG -ATTACAGGCGTGAGCCACTGCGTTCGGCTTAACCATCCCACTTTCTAAAGATAACATTAA -TTATTCATTCATCCAACTCTCCGGAGAAGACATCAGTTGCTACTATTAACGATTTAAATG -GAATATATCCTTCTAGACCCTTGTCTCCATATATAATTTTTTTTAATTTTAAAAAACAAA -AATGGAATCTTAATTCTCCATTCTGTCATCACTTAATGCATCTGAAACAAGTTTTCAGAC -CTGTACACATAGATCTACTTCATTATTTTTTCTTTTTTTTTTTCTTTTAAGACGGAGTCT -CACTCTCTGTTGCCCAGGCTGGACTGCAGTGGCGTGACCGTGGCTCACTGCAACCTGCGC -CTCCCAGGTTCGAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGACTACAGGCATG -CACCGCCAAGCCCGGCTAATTTTTTTATTTTTAGTAGAGACAAGGTTTCACCATGTTGGC -TAGGCTGGTCTTGAACTCCCGACCTCAAGTGATCCACCTGCCTCGGCCTCCCAAAGTGCT -GGGATTACAGGCGTGAGCCACCGCACCTGGCCTACTTCATTCTTTTTAATGGCCACATAG -GAATTCATTGCATGGATGTACCATAATTTGTCTGACAAATCCCCTACTAAAGGACATTTC -AGTTGTTTCCAATTTCAATAGCGCACTCAAAGCTGCAACAAATACTTCTGTGCATAAACC -TACTCATCTGTGGGTGCATTTCCGTGAGACAGACGCTAGAGGGAGAACTACATATGTACT -TCTTGACGGGAAATCTGTGAAAAGTCACACTCCCACCAATGGTGTGTAAGAGCACCTTTC -TGCCAATGCTGGATATCAATCCTTCTCATCTTTGCCAGGCCCACCACTGGGTCCTTTGCG -GGTGGCTTCAACATCTAATGTCATTAAATACTAACTTAGTCAATCTGGACAAAAGACAGA -CACCACCGCTAACCTTCACACGAGAAATTGACACTGTCATTCTCAGTCCCACACAATTAA -ATCCGGTGAAAATGGATTTTCCGCAGTATCAGCGCGGTGATGACAAGAAATGGCTCTGTT -AAAGCAGCCATGGACGTTTTCTGGTTCTCACCTGGTGGCCTGAGCTGAGGATGAAAGCAG -CTGTAATGTAATCCCAGCACTTTGGGAAGACAAGGTGGGCAGATCATTTGAGGTTGGGAG -TTCAAGACCAGCCTGGCCAACATGGTGAAACCCCATCTCTACTAAAAATAAAAAAATTAG -CCAGGCATGGTGGTGGACACCTGTACTCCCAGCTACTTGGGAAACGAAGGCAGAAGAATC -GTTTGAACCCGGGAGGCAGAGCTTGCAGTGAGCTGAGATCGTGCCAGTGCACTCCAGCCT -GGGCGAAAGAGTGAGACTCTTGTCTCAAAAAAAAAACAAAGGAGCTGATATTGTTGTTTC -TTTCTATAAGTGCTCCAGGAAGACCCGGTCCCATGCCACCATGCTCGTCACCATCACAAT -CAACCACAGGGGACAGTTTGGTGAACTGTGAGACCTCCACATGGCATGGATTACTGAGCC -CACATTTCCTATGGTGAGGGGCTCCACACAGAGCTCAAATCCAAGTCATAACCAAACCAG -TCCCCAAATCCTATCTTTGAGGGTCTGTTTCCTGGTACCAATTCCAGATCAGGCAGAGTG -CAATCAATCAAGAGACAAAAACCACACCAGTGATTTTAACAGGGACTTTTTTTTTTAAGA -CAGGGTCTTGCTCTGTCACCCAGGCTGGAGTGCAATGGCATGATCATAGCTCACTGCAGC -CTCAAACTCCTGGGCTCAAGTGAGCCTCCTGCCTCAGCCCCCTGAGTACCTGGGACTACA -GGCGTACAGCAATGTACTTAGCTAATTTTTTTTTTTTTTTTTTTTTTTTAGAGATGGGGC -CTCATTATATTGCCCAGGCTGGTCTCAAACTCCTAGCCTCAAGTGATTCTCCTGCCTCAG -CCTCCCAAAGTGCTGGAATTACAAGGTGTGCACCACCATGTTAGGCCTGAGGAGGAAAAA -TGTATAATAAGGCATTACACAAACTAGTAAAAGGTGGTTAACTACTATGCTAAGAAATAC -AGGAATGGAAAATGCTACTATCCTAGGGAAGAGGGAGAGTCCTCAGAAAAGGAACTCTTT -TTTTCTTTTTTCTTTTTCTTTTTTTTTTTTTTGAGATGGAGTTCGCTCTTGTTGCCCAGG -CTGGAGTGCAATGGTGCAATCTCGGCTCACCACAACCTCCACCTCCCGGGTTCAAGCAAT -TCTCCTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGCATGCACCACCATATCCCACTA -ATTTTGCATTTTTAGTAGAGAAAAGGTTTCTCCATGTTGGTCAGCCTGGTCTCGAACTCC -CAACCTCAGGTGATCCACCCACCTCAGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCC -ACCATGCCCAGCAGAAAAGGAACTCTTGTAAGAGGCTCCTACCCACTCAGGCTGAGTTTC -AGACCTCCTTGGAGCAGGAGTGGCCGCAGCCTGCTGGATGGAGAGAAGCTGCCAGAGTGA -GTGATGACACAGGAACTCCTGCCGCACAGGAGGGAAGGAAAAGAACATCCCAGAAGCATC -CCAGATGCCAGCACAAATACCACCTCCCCTGGCGCCGATCCCAGGCTCTCCCAGGAATTG -TCTGAATATGCCCTGGTTCCCAGTACATAGATAATCTGCTCAAAAGCTGGTGCTGGCCTA -AAAGACCCAAGTCTTCCATGTGTTTGGAGTCTGTGTCCTGCCACAGAGAACAGGATCTGG -CCAGGCGCAGATGCCGGAATTACAACTGCGCACTACCGCGCCCAGCCAATTTTATTGTAG -AGACGAGGTCTCCCTATGTTGTCCAGGCTGGTCTTGAACTCCTGGGCTCAAGTGATCCTC -CCTCCTTGGCTTGGCCTCCCAAAGTACTGGGATTACAGGTGTGAGCCACCACACCTAGCC -TCAAAATACTCTTAAGAAAAAACTTTACCTGGCCGGGTGTGGTGGCTCACACCTGTAATC -CCAGCACTTTGGGAGGCCAAGGTGGCTGGATCACCTGAAGTCAGGAGTTCGAGACCAGCC -CAGCCAACATGGTGAAACCCTGTTTCCACCAAAAATATAAAAATTAGCCAGGCATGGTGG -CGTGCACCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAAACGCTTGAACCCGGG -AGGTGGAGGCTGCAGTGAGCCAAGATCATGCCACTGCATTCCAGCCTGCGCAACAGAGCA -AGACTCTGTCTCAAAAAAATAAAAAATAAAAATAAAAATTTTAGATAAAAAGAGAAAAAG -TAAAAAATTAAAACTTTACCTTATCTCTTTTCTTAGTTCATCTTCGGCTGCTTGATTTTC -TCCAGGACAAATCTTTGCCCTAAACTTCCTGTAATTCTGTTCCCCTTCACTTTGCTGTGC -TTCATGATGTAACTGCTTTATTCGTTTAGCTAAAGAACTCATAGAAAAGTCCAGGGGCAC -AACTTTCTTATTAATTTTCACAGCTACATCAACCTGAGAGGCTGACATGTCCTGAGTATT -TACTAACTTTTGACAAATGTCAGAACTGGAAAGAATTTCTTCTTTTTTAAAACGCTTTGT -GTTTGGGGTTGCGAGATTAGTTGGCTGAGGCAAAACTCGAAATTTACATCCGGTATCTTC -CTGGTTTGAATGGCAGTCCACATCTGAAAAAGAGTCGTCAGTTTTAGGCGCTTTCTCCTG -AGAGTCCACATGTTCCTGCGAGCCCCTGTCCCCTGGGGAGCTGGCCGCATACTCGCTGCT -GCAGTGACTGCCCGTGTCTGGGATGCTGAACCCCTCAGAATCCACGGAAGTGCTGCCGTG -CCCCGAGTCCTTCTCCACCTCCGCTCTGTCCGTAGGGTCACTGGGTCCGTGACTGGAACT -CACTGCCTCTTTCTGAGGTCTCAGGACGCCTTTGTCAGAGATGGCACCTGAAGTGCTAGA -AGACAGCATACCCCTTTTCTGTCCTAGAGGGCTCCTTCTTGGTTCTGGAGTCTTTGGGCT -GTGAGGCTTGTTCTCTGTTGTGTGACGAAGAGAAAAGGCCTCTCGCAGTCTGGAAATGGA -CACGTCTTTTTTTTCTTCTCCAGTCCTTAATGAAGGGGATTGATCCTGCTTTTCTACCAT -GGGCTTTTCCAAATCCGCTGCATGCATTTTTATTAAGTTACCTAAGCAAACGTGGACGGA -GAAGAGGGTCAGGGACTATCCTGAAATGGTGAGAGGACGTGCTTATGTGAACAGATACTT -CACAAAAGAGGAGATCCACATGCTAATTACACAGATGAACACAGTTCAATGTTCAAAATA -AAACTATAATATGGGCCAGGTGTGGTGGCTTACGCCTGTTATCCCAGCACTTTAGGAGGC -CAAGGCAGGGGGATCACATGAGGCTAGGAGTTCAGGACTGGTCTGGACAACATGGTAAAA -CCCTGTTTCTACTAAAAATACAAAAATTAGCCGGGTGTGGTGGCATATCTGTCATCCCAG -CTACTTGGGAGGCTGAGGCACGAGAATCCCTTTAGCCCGGGAGGCAGAGGTTGCAGTGAG -CCAAGATGCCACCACTGCTCTCCAGCCTGGGTGACAGAGCAACACTCTGTCTCAAAAAAA -AAAAAAAAAAAAAAAAAAACCACAACACAATGCAATATGGCCATATACTCACCAGAATGG -TAAAATTAAAAAAACAACAAATGCTCACAAAGATCAGGATCAAGAGGAATGCCTGAATAC -CTCTGGTAGGAATGAACCTGGTACAGCTGCTTTGAAAAGTTCTCTGGGAATACCTCCTAA -ATCTGAATGTATGCACACCTGCAACCCAGCATAGCTACTCCTATCAGAAGTGCCTATTGG -CCGGCACAGTGGCTCACGCCTGTAATCCTAGCCCTTTGAGGTCAGGAGTTCAAGACCAGC -CTGACCAACATGGTGAAACCTCATCTCTACTAAAAATACAAAAAAAAAATTAGCAGGGCA -TAGTGGAATGCACTTATAATCCCAGCTACTAGGGAGAATGAGAATGAGGCAGGAGAATCA -CTTGAACCTGGAAGGCAGGGTTGCAGCGAGCCAAGATCACTCCACTGCACTCCAGCCTGG -GCGACAGAGTGAGACTCCCTCTCAAAAAAAAGAAAGAAGTGCCTATCTATGCTCGTCAAA -AAGACGTGGATGAGGATGTTCATGACAGCATTCTTCATTATAGCCCCAAACTGGAAACAA -TTCAAATATTCACAAATGATGATATCTGACTATAATGGAACACTGTATAGCGAACGAATA -AATGAATTTTGCCACATGACTTGGGTGAATCTCACAAACAAAATAATGAGAGAAAGAAAC -AAATCACAGAAAAGGACAGACTGAATAACTTCAAATTAAAAACAGATTAAACTATACCGT -TTTGGGTTTTTTTTGTTTGTTTGTCTGTTTTTTTGAGACGGAGTCTCGCTTTGTCACCCA -GGCTGGAGTGCAGTGGCACAATCTTGGCTCACTGCAAGCCCCTCCTCCCGGGTTCACGCC -ATTCTCCTGAGTCAGCCTCCTGAGTAGCTGGGACTACAGGCGCCCGCCACCACGCCCGGC -TAATTTTTTGTATTTTTAGTAGAGACAGAGTTTCACCGTGTTAGATAGTCTCGATCTCCT -GACCTCGTGAGCCGCCCGCCTTGGCCTCCCAAAGTACTGGGATTACAAGCATGAGCCGCT -GCGCCTGGCCTAAATTCTACTGTTAGAAGTCAGGAAATCCCAGCATTTTCAGAGGCCAAG -GCTAGAGGACTGCTTGAGCTCAAGAGTTTGAGACCAGCCTGGGCATCATGGAGAAACCCC -ATCTCTAATGACAATACAAACATTAGCCAGGTGTGGTGGTGGGCGCCTGTAATCCCAGCT -ACTCAGGAGGCTGAGGCAGGAGAATCTCTTGAACGTGGGAGGCTTCAAGGTTGCAGTGAG -CTGAGATCGCATCATTGCACTCCAGCCTGGGTGACAAGAGCGAAACTCCATCTCAAAAAA -ACAGACATGACAAGGGAGTTAAAAATGCAGTCACTGCAGACTTCTTCTAATCATATATCT -TATATGACTTCATCCGTTTACAGTTTACAAAAAACTAGAGGTACTTGGAGGCAGCTACTT -GGGAGGCTGAGGCAGGAAGATGGCCTGAGCCCAGGAGTGTGATGCTGCAGTGAGCTACAA -TGGCACCACTGCAGTCCAGCCTGGGTGACAGAGCAAGTCCCTGTCTCAAAAAAGAATTAA -AAATGATAAAATAATATAAGAGACTTTGTTTTCATGTCAAAAAAAAGTTTACTTGGAAAA -AATAAGGAAACACATTAGCTAAAAGCTTTAGAAGCTGTTTGTACACTGTATTTTTCTTAC -CTTCAACATCCAGCAGTGGCTGCTGACTGACATTTAGCTTGTTGACATCACTATCAAACA -TTCCTATCAAAGAGGTCTTTAAAACTGCCAACAAAAGCTTTTCCTCTTGTAGCAAAATTT -GCCTTTTATCTGGAGTAACATTGATATCAACGCATTCTAAGGCAAAAAAGAAAACATATT -TATTATGTTTAAATTCACTTTTATTTTATTTATTAATTATTATTTTCAGACAGCGTCTCA -CTCTGTCGCCTAGGCTGGAGTGCAGTGGCGCGATCTCAGCTCACTGCAACCTCCGCCTCC -TGGGTTCAAGTGATTCTCCCTGCCTCAGCCTCCGAAGTAGCTAGGATTACAGGCAAGTGC -CACCACACTGGCTAATTTTTGTATTTTTAGTAGAGATGGGGTTTCACCGTGTTGGCCAGG -CTGGTCTCGAACTCACAACCTCAAGTGATCCACCCGCCTTGGCCTCCCAAAGTTCTGGGA -TTACAGGCGTGAGCCACCGCGCCCAGCCAAATTCACTTTTAACAATAGAAATTTCCCCAT -CTATTATTTCATTCACTTGTATTTATCACAAGTGCTATTAAAAACATTACAGTGTCCAGG -TTAAGATTCATAAGTTATGAAATCAGCTTTTTCAAATAAATGAGCAAAAGACAATTTTTG -AATAGACAAAATACGGAAGGGCTTAATTAGGTAAATTGTTAAAGGAAAAGCAAATAAACA -CATAAAAATAATTTTAAATATGCAAACTAAAATAAGATATTTTAATCCCCTACTGAATTT -AGCTTAACAATTATAATACCTAGTACATTATAGGTAGGTGTGTAAATTGGTACATCTAGA -ACACAATACAGAAAAAGCCTTAAAATGATCATATTCACTGACCCAGTAATTCTACTCCCG -GCAATTTATATTCAGAATAATTAAAGATGTAGGCTGAGTGCAGTGGCTCACACCCTGTAA -TCCCAGCACTTTGGGAGGCTGAGACGAACAGATAAGTTAAGGTCAGGAGTTCAAGACCAG -CCTGGCCAACATGGCGAAACCCCGTCTCTACTAAAAACACAAAAAATTAGTCAGGCATGG -TGGCAGGTGCCTGTAATCCGTGCTACTCAGGAGGCTGAGGCGGGAGAATCGCTTGAACTC -AGGAATCGGAGGTTACAGTGAGCTGATATTACACCACTGCACTCCAGCTTGGGAGACAGA -GCAAGACTCTGTCTCAAAAAATATCTAATAATAAAGATGCAGATAATGATTTAATTATAA -GGAAAGTATTTATAATTTCCAAAAACTAAAAACAATTTAATTTTGAAAAATTTAAAAATT -AAAATACCAAACTATAACCATGCATTGGAATATAATTCACCTATTAAAACCACATTTCTG -ATCAATTTCTAATAACATGGAAAAGAAAACATTCACATCTAAGGATAAAGAGCAGTATAC -AAAATTATTTTCTCATCCCAAAGAATATGGGAGTAGGGGAGAGAGAGAGAAAGAGAGAGA -GGACAGAAGATATTTTTTAAGGTATGTACATATGTGTTTCTAAGTATCTAGAAAAAATAC -TCAATTACAATAAACCAAAATTTTAACAATCAGAAAAAAAAATCTATATGAAATGAATTA -TTTATGAAATTAGGAAGAACATTTCATCTACTTTCTCCCTTGGTTGACATTAAAAAAAAT -TACATTTTCCTAACAATATAATTAACATAGTCTCAAGTAGAAAGCGGGAACTCTGTTTAA -AAAAAAAAAAAATTATAGGGCCAGGCACGGTGGCTCATGCCTGTAATCCCAGCACTTTGG -GAGGCCAAGACGGGCAGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTG -AAACCCTGTCTCTACTAAAAATACAAAAAATTAGCCAGGTGTGGTGGCACGCACCTGTAG -TCCCAGCTACTTGGGAGGCTGAGTCAGGAGAATCGCTTGAACCCGGGAGGCAGAGGTTGC -AGTGAGCCGAGATCACGCCACCACACTCCAGCCTGGGTGACAGAGCAAGACCCCGTCTCA -AAAAAAAACAAAAACAAAAAACTTACATGACCATAAATTGTTATCTCATTCCAGTCATAG -CAGAGCTGTAGAATTTCATTTTATTCTTTGAGGCATTAGTCACTAGTTGTACTGAAATGC -CAATGGAACTTACCTGAATCAACAGAAATGTTAAGAACAACAAATGGATACTGGTGTCGA -TTATACATGTGGTAGACCTCATTCACGAGTCTGCAGACCTGCACAAAATACAAGGAGTAG -AAAAGAATAAATGACAAATGTTCCCAGCCCCCCGCATTCTAACAACATTCTATTCTAACC -AACCAGCATGTTCTTAGAAGGGGATACTTTTTTGTTTTTTTTTTTTTTGAGTCAAGGTCT -CGCCTTGTCACAGCCTGGAGTGCAGTGGAGCAATCATGGCTCACTGCAGCCTCAACCTCC -CAGGCTCAAGTGATCCTCCTGTGTCAGCCTGACATGTAACTTGGATTACAGGCAGGATTT -TTTTTTCTTTTTTTTTTTCAACGGAGTCTCGCTCTTGTTACCCAGACTGGAGTGTAATGG -CACGATCTTGGCTCACTGCAACCTCTGCCTCCGGGGCTCAAGTGATTATCCTGACTCAGC -CTCCAGAGTAGCTGGGATTACAGGCACACGCCACCATGACCAGATAATTTTTGTGTTTTT -A +>chr7_5957000_6010000 +CTCGTTTCTAAAAAAAAAAAAATTATTTTTTTAGTTAGCCAGGCATGGTGGCAGTGGGCA +CCTCTGTAGTCTCAGCTACAGGGGAGGCTGAGGTGGGAGGATCGCTTGAGCCAAGGAGGT +AGAGAGCCCTGATTGCACAACTGCAGTCCAGCCTGGGCAACAGAGCAAGACTCTGTCTCT +AAAAACAAACGAACACGCTGGGCGCTGTGGCTTACGCCTGTAATCCTAGCACTCTGGGAA +GCCGAGGCAGGTGGATCACTTGAGGTCAGGAGTTCGAAACCAGTCTGGCCAACATGGTGA +AACCCCGTCTCTACTGAAAATACAAAAAAAAAAAAAAATTAGCCGGGCCATGGTGGTGGG +TGCCTGTAATCTCAGCTACTCCAGAGGCTGAGGCAGGAGAATTGCTTGAACCCAGGAGGT +GGAGGCTGCAGTGAGCTGAGATCCTGCCACCGCACTCCAGCCTGGGCAACAGAGCAAGAC +TCTGTCTCTAAAAACAAACAAACAGGCTGGGTGTGGTGGCTCACGCCTGTAATCGCAGCA +CTTTAGGAGGCTGAGGCGCGCGGATCACTTGAGGTCCGGAGTTCGAAACCAACCTGGCCA +ACATGGTGAAACCCCGTCTCTACTAAAAATACAAAAAAAACAATTAGCCCGGCCGTGGTG +GTGGTGGGTACCTGTAATCTCAGCTACTCCAGAGGCTGAGGCAGGAGAATTGCTTGAACC +CGGGAGGTGGAGGCTGCAGTGAGCCAAGATTGCGCCAGTGCACTCCAGCCTGGGAGACAG +ACAGAGAGAGACTCTGTCTCAAAACAAAAACAAAAACAAAAACAAAACCCAAAAAGAAAT +ATACATGTGTTGAGAATCGGCGGAGCATCCGCCTCTGGGTATAAGCTGCTACCCCGCCCG +GGCGTACCTGGATGCCCCTCTCCCACCGCCCGGTGTACTCTTCGTTGGTGGTCAGCCACC +TCATCCTCCCCTCCCCGTGGCGCATGTTGTCTTCCCACTGGCCTTCGTATATATTTCCAG +ATTTATAACTAGGATGAAAGAAACCAAAGAAAAACAATCAGTTACCTCCTACACAACATT +TACCTTTAAGACATTCTTTTAAACACTCCCCTTGAGCTCCTTTGAAGAAATCCACCCCTT +GTACTTATACAATCTTCTCTGTATTTAAATTCAGGCCAGGCGTGGTGGCTCACGCCTGTA +ATCCCAGCACTTTGGGAGGCCGAGGCTGGAGGATCACCTGAGGTTGGGAGTTTGAGACCA +GCCTGACCAACATGGAGAAACTCCATCTCTACTAAAAATACAAAATTAGCCCAGCTACTT +GGGAGGCAAAACTCCATCTCAAAAGAAAAAAAAAAATGCAAAAATTAGCCGGACATGGTG +GCAGGCACCTGTAATCCCAGCTATTCAGGAGGCTGAGGCAGGAGAATCACTTGAACTCAG +AAGGTGCAGGTTGCAATGAGCCGAGATCATGCCACTGCACTCTAGCCTGGGCAACAGAGC +GAGACTGTCTAAAAAATAAATAAATAAAATTTTTAAAAAATCAATGGATAGGCTCATGGT +CCTAAGGGAGCAGAATGAGTCACTTTATTAAATCTTCTGACTATTTAATAAGGGGACAAA +GTGGGTAAGAGCCGGGTTTTTAAAATTTTTTAATAATTCCCTATTGTATCATGATTAGTG +AATATTTGGCCAGTTTTTGAGATGAGATCTCACTGTGTCACCAAGGCTGGAGAGCAGTGG +TGTGATCATGGCAGGAGAATTGCTTGAACCCAGAAGGCAGAGGTTGAAGTGAGCTGAGAT +GGCACCACTGCACTCCAGCCTGGGTGACAGAACAAGACTCCGTCTCAAAGAAAAGAGAAA +AAATCCACTCTGCTTAGAGAGAAAATGTTCCGTGCAACTTTTGCATCTTACTTTTAAATA +TCCGAGGTGAACGCTATTGGGCCCACAAACCCTTCTTCATCTACACCCCAAGCGCGGCGG +TGGTCATACCTACCATCTTATTCCCCAGCCCTTTTTGATGTTTTGTACCCAGTCTCCCTC +GTACCAACACGTACCCTCTTGATTGTAATAAATGGAGCCCTGAAACAAATAATGTCATCT +TTAAAACTATCAAGCCTCATGACACAAATGCTTTGTCAAATGTAAGGATATTAACTTGAA +AAGTAGAACCTACACAGAGGTCAATGTCATACATAGGCAAGACATGTAAACTGCTATTTT +TCTGTTTTGCTATCAAGAAAATGGTAAAACTGCTGCACAAAGGGAAATGAGATAATGTCA +CAAATCAATTGCTCCTTAATAAAGTGCCATATTGGCCAGGCACGGTGGCTCACGTCTGTA +ATCCCAGCACTTTGGGAGGCCGAGGTGGGCGGATCACAAGGTCATGAGTTCAAGACCAGC +CTGGCCAACACGGTGAAACCCCGTCTCTACTAAAAACACAAAAATTAGCTAGGAGTGGTG +GAGCGTGCCTGTAATCCCAGCTACTTGGGAGGCTGAGGCAGGATAATCGCTTGAACCTGG +GAGGCAGAGGTTGCAGTGAGCCCAGATCGTGCCACTGCACTCCAGCCTGGGCAACAGAGC +AAGACTCCATCTCAAAATAAAATAAAATAAAAAGTATCACATTAAGGCACAGAATGACTG +TATTCATCATATTCGAGTATATTCATTCTATCCAGTAACTATTAGTCAATTAAGTACCTA +GAGAAATCCTGTCTGTTGCCACCTGGAGTGAACAGTTGCGCCTTCCATGTAACGGAAGGT +CACTCTCTCTTAGGCACCAGATCCACTGTTGTTTTACCCATTTGGACATGCTACTCATTT +TACCGCCTCCGAGTATAAGTGAGCATAGAGTACCCTTTGTTTGATCTACATAGAAAAGCC +TCAAAAGGCTTTTTCACAGGTTTATCTGTGTGTGTGAGAGAGAATTTTTCTATCTTCTTT +CTCATGATCAGGCAAACTCATTCCTTCTTGCAGCCATGCAGATGCTGCTGTCTAGAAGTC +ACCACCCCCAATCCCTCCAATATGTCTCAAGCAATCTGCTGTAAAACACACACACACACA +CACACACACACACACACACAACAACAACAACAACACAACTCAATAAATAGCCTATTAAAG +CATGCATACGGCCAGGCACAGTGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCTG +AGGTGGGTGGATCACTTGGGATCAGGAGTTCAAGACCACCCTGGCCAACATGGCGAAACC +CCATCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGTGCACACCTGTAGTCCCAG +CAACCTGGGAGGCTGAGGCAGGAGATTTGCTTGAACCCGGGAGGCAGAGGTTGCAGTGAG +CTGAGATGGCACCATTGCACTCCCGCCTGGGCGACAGAGCAAGACTCCATCTCAAAAAAA +AAAAAAATTAATAAAATGGTTAATTTATGTGATGTGAATTTCGCCTCAATAAACAAAAAG +TGAATATGCCCTGGACAGCGCCGCTAGCCCCTACCCCCTTCTCTCCCTCCATGTGGCCAC +CCAGCCCCTCCCCTGCCCTCCACATGGCCACCCCACCCCCTTTCTGCCCCCCCGACCTCC +CCGACCTTGCCCCCTCATGGCTGCCCCCCCCATGTCCGCCCACCCCCTTCACTCCTGCCC +CACCTGCCCTCCACGTGGCCACCTCGCCCACCTTCCCGTGCCGCTTGCCATTGCACCAGT +GGCCGATGTAGGACACAGGCTGGGTGCTGCACTTGAACATCCCGAATCCGTTCCTCATGC +CGTTGACCACTTCGCCTTCATACATGCTGCCGTCCGGCCACGTGTACACGCCGTGGTTCA +TCGGGACATTCTTCACAAAGTCGCCCTGAAGCAGAACGGCCATGGGGTGACAGAAGGAAG +TGTTGGGGGGTGGGGGCGGGAATCCCTAGTCCTGCGGGCGGTTCCAGGAGCTGCTTGACC +TCTGATTCTGTTCTTGCCTCTCCTGTGGACACACTGAACATCCCCCTCACACTCTCTCTC +TTCCTTCCTTGTCTGCTCTCATCGCATCCTCTCTCATCTGACCCGACCAGTGGGCGGAAG +CTCAGGCAGGAGGAAATATCTGGGAGGTTGCAGGTTGACTAAGTTCGAAGAAACAAGCAG +GTGACGTTGGAAAGTGCTGGCTTCCAATCCTGACCTGGGGAACTTCAGATTCTTAGAACC +CACCTTGGCAAGGTGCAGTGGCTCACACTTGTAATCACAGCACTTTGGGAGACTGAGGCG +GGAGGACTGCTTGAGGCCGGGAATTTGAGGCCAGTCTGGGCAACCTAGGAAGACCCTGTC +TCTAGAAAAAGATTTTATTTGTTTTTGTTTTTATTTTTGAGACAGAGTCTCACTCTGTCG +CCCAGGCTGTAGTGCAATGGCGCCATCTCGGCTCACTGCAACCTCTGCCTCCCAGGTTCA +AGCAGTTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGCACCCATCATCACACC +CTGCTAATTTTTTTTGTATTTTTAGGAGAGACGGGGTTTTGCCATGTTGGCCAGGCTGGT +CTCGAACTCCTGACCTGAGGTGATCCACCTGCCTCGGCTTCCCAAAGTGCTGAGATTAAC +AGGCATTTAACAGGCATGAGCCATCATGCCTAGTTTTTGTGGATTTTTTGTTGTTGTTTT +TTTGTTTTTTTGAGACAGGGTCTCACCCTGTCACCTAGGTTGGAGTGCAGCGGCACAATC +ATAGCTCACTGCAGCCTCGACCTCCCAGGCTCAAGAGATCCTCCCACCACAGCCCCCCAA +GTAGCTGAGACTACAAGTGTGTGTGCCACCAAGCCTCACTACTTTTTAAATTTTTTGTGG +AGATGGAGTTTCTCTATGTTGCCCAGGCTGGTCTGGTCTCAAACTCCCAGCCTCAAGTGA +TCTTCCCACCTTGGCCTCCCAAGTAGCTGGGACTACAGGTGCTGGCCACCAAGGTGCAGT +GGTGCACGCCTATAATCCCAGCACTTTGGGGGTGCTGACGTGAGAGGATCTGTTGAGCCC +AGGAGGTTGAGGCTGCAGTGAACTATGACCACTGCATTCCAGCCTGGGCGACAGAGCAAG +ATCCTGTCTCTAATGAAAAAAAAAATAACCCGCTCGAAGGAGGTGAATTCACTGTTCCCT +CCAAGGCTTAGTGATGACTGGGGACATCCCTCTTTCTTTTTCCTTTTTTTTTCAAGATGG +AGTTTTGCTCTTGTTCCCCAGGCTGGAGTGTAATGGTGTAGTCTCGGCTCACTGCAACCT +CCGCCTCCCAGGTTTAAGCAATTCTCCTGCCTCAGCTTTCCGAGTAGCTGGGATCACAGG +TGTGCACCACCATGCCCCGCAAATTTTTGTAGTTTTAGTAGAGACAGGATTTCACCATAT +TGGCCAGGCTGGTCTTGAACTCCTGACCTCAGATGATCTGCCCACCTTGGCCTCCCAAAG +TATTGGGATTACAGGCGTGAGCCACCATGCCCGGTCAGGAAATCCCTCTTTCTGCCACGG +TCATCAAAATAGTCTGTAAACAAATCAGCCAACAGCCTGCCCCAGGGGCACCTGCCAGGG +AACGCGCTCTGCCCAGGACGCCTGAGTGGGCAGCAGGCAGCACAGTGCACAGCACCCAGC +AGCATCGGATTCTCTTCCAGGAACCTGAACTCCCTGGAGGCAGCCACAGCAGCAGAGAAA +AGAGGACAGCACGCCGTGGCCTGATCACCAGCCAGGACCCATGAGGCCAGTCGGCCTCTG +AGAATGCTTCTAGGAGCCCCCCGAGTCCTGCCCAGAAGCCCCCCTGACTGGGCTGGAGTG +GGGGTCTGTGCCTGCAAAAATGACCTCCCCCCCTGCCGGGAGTTTCCCGAGACAACGAGG +CACAGGGCGGTTCTTGGTAAGTTGTCACTTAAGGACCAGAAACTGGCCCAGTGCGGTGGC +TCACACCTGTAATCCCTGCACTTCGGGAGGCTGAGGTGGGCAGATCACCTGAAGCCAGGG +GTTTGAGACCAGCCTGGCCAACATGGCGAAAGCCCGTCTCTACTAAAAATACAAAAAGTA +GCCCGGCGTGGTGGCGGGCGCCTGTAATCCCAGCTACTCTGGAGGCTGAGGCAGGAGAAT +TGCTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCGAGATCCCCCCGCTGCACTCCAGCC +TGGGTGACAGAGCAAGACTCTGTCCCACAAAAATAAATAAAATAAAGACCAGAAACCTTA +CATGTCAGCCACCGGCTAGAAGGCGGGATGTCGCGTGGGAAGGGAGCTGGCATGAACCCA +AGGTGGGGGCCCAATCCTCAGGCTCCCCTGGAACTTGGAGATCCTCCTCGCCCCGCCAGT +GACGGTCAGCCCCTCCCTCCCTCTCCCCGCTCCTCTGCAGCATGCCTCTCACCGCCCAGC +TGCAGGTGGCTTCCCGGCCCAAACTTGACTCCGTTTCCATCATTGCCTGTGTGTTATTTG +AATAAGTGCGTTATGCGCATGTGTTTTAAATGTCATCATTACCATTTATAAACACCATCT +GTTAGCAACTCTGCATTTGGGATTTTTAGAATAGCATTTCAGGTGCTCACTCACTTTGTG +GGTGGGAATTGAGCCTGGTACAATCTCTTGGCGAACAATTTGGTCCTTGCAATCAGCTTA +AAAATACACATTCCCCTCAACCCCACAAGACAGGTTAAATAAAAGCCACATAATGGAATA +CATGCAGCCACTAAAAACAGATCTACATGAATGGATATGGTTTGATCTCAAAATTAAAGG +TACAGGCCAGGTGTGGTGGCTCACGCCTGTAATCCCCAGCACTTTGGGAGGCCAAGGTGG +GAGGATCGCTTAAGCTTAGGAGTTCGAGACCAGCCTGGGCAACATGGCAAACCCTGTCTC +TACAAAAAAAAAAAAAAAAAGTAAAAATAAATTAGCCGCGTGCTGCGGAGCACACCTCTA +GTCACAGCTACTCAGCAGGCTGAGCCAACAGGATCGCTTGAGCCTAGGAGTTCAAGGCTG +CAGTGAGTCATGATCTCACCACTGCACTACAGCCTGGGTGACAGAGCAAGACCCCATCTC +AGACTCACTAACTAACTAAGTAAATATGCCAAAGAGAGTGTATAATAAACTATGTGTGTT +TGTAAAAAGCAAGACAGGCTACAGAAGTTCCAGGCTGCAGTGTTATGATCGTACCACTAT +ACTCCAGCCTGGGCAACAGAGCAAGACCCTGTCTCAAAGAAAAAAGTAGGACAAGCTACA +TACATGTACGTGTGCTCTCTGTGCTTAGAACACATAGAATACCTCTAGAACACACAGATG +AAACCAATAACAATTACTGGCGGGTCCCATGCAGTCATGAGTTACTAGATCCTCTGGTTC +TGCAAATTTTTCTTAACCCATATGCTGAATGACATCTACGAAAACAGTCTGTTCAATTGT +GGGAAACTGATTGTTCCATCCAATAATCACAGCTTAGAACTATAACTGGTTATATGCCTC +ACCTCATATTTTAATCCATCGGCCCAAATATAAGTCCCCTGTCCATGCATGAGTCCTTCT +GAAAACATACCCTTCAAAACAAAACAAAGCAACGACAAACACTTAGAATACAGCTGACAC +ATATACATATTTGAGATAGGGTCTGGTTCTGTCACCCAGGCTGGAGTGCAGTGGTGTGAT +CATAGCTCACTGCAGCCTCGAACTCCCAGGCTCAAGCAATCCTCCCACTTCAGCCTCCCG +AGTAGCTGGGACTACAGGCATCCACCACCATGCCCAGCTAATTTTTGTATTTTTTGTGGA +GACGGGATTTCACCATGTTGGCCAGGCTGGTCTTGAAATCCTGAGCTCTAGCAATGCGCC +CGCCTTGGCCTCCCAAAGTGCTGGGATTATAGGCATGAGCCACCGCGCCTGGCCTGCAGC +TGATGATTCTCTCCCACAACTGCCTTATCCCGATTTCACATGCGTGAAGATGCTTGTCTG +CACACTCAGCACCAGCTGAGTCCTAGTGAGTCCTACTCTGAGCTGCCTCCATGCTGGGCT +CCATCCTTCTCTAAAAAGGATCTAAGAGGTCCTCATCTTCATGACCTAAGGATGACCTCA +GCTACAAAAATGTGTTCTCAACCGGGTGCGGGGGCTCACACCTGCAATCCCAGCACTTTA +GGAGTCTGAGGCAGGAGGATAACTTGTGCCCGGCAGTTCAAGACCAGCCCTGGCAACGTA +GCAACTCCTTGTCTCTACCAAAAAAAAAAAAAAAAAAATTAAATTAGCCAGGCGTGCTAG +CTCACACCTGTAGTCCCAGCTATTCAAGAGGCTGAGGAGGGAGGATCATTTGACTCCAGG +AGGTCGAGGCCACAATGAGTTATGATTGTGCCACTGCACTCCAGCTTGGGTGACACAGTG +AGACCCTGTCTCAAAAAATATAAAATAATCAGGAAAAGAAACAAATCTAAAATAACTTTT +GTTATATTGAGCATTATTTTTACCTTAAATAGGTAATCAGGTTTCAGAATAAAATCGGCA +TGAAGAGCTTCCGATTTCTTTTGAAGCATCAGTGGATTTTACTGAAGATTTACAAATCTA +CGACCATCACCCCACACCTTCCTCCCCTTCCTGCAGGTTCTCAAATGGGCAACTTACACG +ATAGGTACAACCGCCTTGAAAGGCTGCGAAGCCTTCTCCCTCATACAGCCCACGAACCTT +TTCCCCTTCATAGCTACAAAGAAATAAAGGTAATTCAAGGTAATGAACAATGTGAATAAA +CCCAAGTGACAGTGGGTTAAACTATATAACTATGTAATGGGAAGAATGAAGTCAGAAAAA +AAAAAATATATATATATATATATACACAGAGCTAGAAAGTAGAAGAGGTTACCAGGGGTT +TGAAAGTAGGGTGAGGAATGAAGGCGTTTCGGGGTTTTTTTGTTTGTTTTTTGGGGATTT +TTTTTGAGATGGAGTCTCACTCTGTCGCCCGGGCTGGATGGAGTGCAATGACGTGATCTT +GGCTCACTGCAACCTCTGCCTCCCGGGTTCAAGTGATTCTCCCGCCTCAGCCTCCTGAGT +AGCTGGGATTACAGGCACATGTCACCACGCCCAGCTAATTATTGTGTTTTTAGTAGAGAT +GGAGTTTCACCATATTGGCCAGACTGGTCTCAAACTCCTGGCCTCAAGTGATCTGCCCGC +CTCAGCCTCCCAAAGTGCTGGGATTACAGGCTTGAACCACCGCATCTGGCCAGGAGTTAC +TATTTAATAGACGGTCGTACAACACTATGAACGTACTTAATGCCATTGAATTGTACACTT +AAAATAATTAAGATAGTACATTTTGTTATATGTTTCACCACAATAAACTCTATATATACA +CACGCCATGGGGCTGTATGTTTGCTATTTGGGTGATGGGCTTACTTAGAAGCCCAAACCT +CAGCATCACACAACATGCCCATGTAACAAACCTGCACATGTAACCCTCTAAATCTAAAAT +AAAATAATTTTTTTAAATACATAAAATTACCTTCAGGCCAGGCACAGTGGCTTACGCCTG +TAATCCCAGCACTTTGGGAGGCTGAGGCAGGTGGCTCACCTGAGGTCAGGAGTTCGAGAC +CAGCCTGGCCAACAGGGTGAAACCTTGTCTCTACTAAAAGTACAAAAATTAGCCAGGCAT +GGTGGCGGGCACCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATTGCTTGAAT +GTGGGAGGTGGAGGTTGCAGTGAGCCAAGATCACACCACTGCACTCCAGCCTGAACGACA +GAGTGAAACTCTGTCTCAAAGTAAAATAAGATAAACCGCCTGACTGGCAGTGTTATACCC +GATGGCACCCCCATTAAAATCACCTTTCCACTATGAGTTTGGTCAGAATGGACTCTTCGT +ATTGGGTGGCATCTTCGTTCTGCTGAACGTTTTGGCGGTCTTTTTTGGGTTTCACTTCGT +TGAGCTGCATTCCCAGCAATGGGACACCAGCTGGGGACATCTCTTGCCTAGTGGTGTTGC +CATCTTGTTTGGAAAAGTCTAGATTATCAGAGAGAGATGAGGGAGAGCGGGCAGACTTCT +CCCCTTTTTTGTCTGCTTTTTTCTTTTCTTTCACCATTGCCTTGGGAAGATCCAATGGTT +ACTTGAATCAAATGATTTCTTTGGTTCAGAGCTGCTTGTTTCAAAGCACTGATGAGTTTT +ATCTGAAAAATAAAAATTACGTCTCCAAACACTTGGGGTTTTCATTTGTAGTTAAAATTT +CAGTTTTACAACACAATGTCATTATCATTCTCCTGACAAAGTCTGAAAAATTAGTTACCA +GGGCCGGGTGTGGTGGCTCACACCTGCGATCTCAGCACGTTGAAGGGCCAAGGTGGGAGG +ATCATGTGAGTCCAGGAGAGGGAGATCAGCCTAGGCCACGTAGTGAGATGCCACCTCTCT +ACAAAAAATAAAAATAAATTAGCCAGGCGTGGTGGCACATGCCTGTAGTCCCAGCTACTA +GGGAGGCTCAGGTGGGAGGACTGCTTGAGCCTGGGAGGTCGAGGCTGCAGTGAGTAGTGT +CACACCACTGCACTCCAGTCTGGGTATCAGAGCAAGACTCTGTCTCAAAAATGACTATAA +TTACAAGTTTCAAGTACCATCAGTTTATAAAAATACAACCTCAACATCGCATTGCTTGTT +CCTAAAATTTTTTTATTTTTAATTTTTGAGACAGAGTCTCACTCTGTCACCCAGGCTGGA +GGGCAGTGGCACAATCACAGCTCACTCTAGCCTCAACCTCCTAGGCTCTGACGATCCTTC +CATCTCAGCCTCCCAAGTAGCTGGGACCACAGGCATGCATTACCACACCTGGCTAATTTT +TTGTAGAGACAGGGTCTTGCTATCTTGCCCCGGCTGGTCTGGAACTCCTGAGCTCAAGCA +ATCCGCCTGTCTCAGCCTCCCAAAGTGCTGGGATTATAGGTGTGAGCCACTGTACCTTGC +CCCAAAAATTATTTAAGTTGGAACCATTGTCTAGCATTGTTTCTTGAAAGGTAACCCTAC +ACATGAAATAGGCTACTTCACCTCTCAGGTCTTGCATGCAGCCAATTCACACTTTAAAAG +CCCCTCTCTGGCCGGATGCAGTGGCTCACACCTGTAGTCCCAGCACTTTGGGAGGCCAAG +GCAGGTGGATCACGAGGTCAGGAGATTGAGACCACCCTGGCTAACACTGTGAAACCCCGT +CTCTACTAAAAATACAAAAAATTAGCCAGGCATGGTGGCACATGCCTGTAATCCCAGCTA +CTCAGGAGGCTGAGGCAGGAGAATCACTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCG +AGATCACACCACTGCACTCTAGCCTCGGCAACAGAGCAAGATTCTGTCTCAAAAAAAACA +AAACAAAACAAAAGCCCCTCTCCTTATAGGTCAGCATTGTAAAGTGTGCAAGAGCTGGAT +TCGGAGTCCTGCATTGCCCATTACCAGTTCTATGGGTTTGTTTATTTATTTATTTATTTA +TTTTTGAGACGGAGTCTCACTCTCTTGCCCAGGCTGGAGTGCGGTGGTGCGATCTTGGCT +CACTGCAAGCTCCACCTCCCGGGTTCATGCCATTCTCCTGCCTCAGCCTCCTGAGTAGCT +AGGACTACAGGCGCCCACCACCACACCTGGCTAATTCTTTTTGTATTTTTAGTAGAGACG +GGGTTTCACCGGGTTAGCCAGGATGGTCTCAATCTCCTGACCTCGTGATCTGCCCGCCTT +GGCCTCCAAAGTGCTGGGATTACAGGCGTGAGTCACCGGGTGTGGGTGCCCGGCCCAGTT +CTGTGTTTTTTGGGTTTGTTTTTTTTTTTTTTTTTAGACAGACTCTCTAGCCCTGTCCTG +CAGGTTGGAATGCAGTGGCAGGATCTTGGCTCACTGGCTCACTGCAACCTCACTGCAGGT +TCAAGTGATTCTCCTGCCTCAGCCTCTCGAGTAGCTGGGATTACAGGCACCTGCCTCCAT +ACTCAGCTAATTTTTGTATTTTTAGTAGAGATGGGGTTTCACTGTGTTGGCCAGGCTGGT +GTCGAACTCCTGACCTCGTGATCTGCCCGCCTTGGCCTCCCAAAGTGCTGGGATAACAAG +TGTGAGCCACCGTGCCTGGCTGGTTTCCTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTGA +GACGGGGTGTTGTACATTTTGCCCAGGCTGGTTTCAAACTCCTGGCCTCAAGCAATCTTC +CCACCTTCTCCTCCCAAAGTGCTAGGATTGCGGGCATGAGCCACTGAGCTCGGCCAAGTG +CTGTGTTCTGAAGCAAGCTGCTTAATCTCCTCTGCCTCACAAATAGAAATAACAGAACCT +TGTCTCATAAGAATTAAACCGATGACACACAGAAAAATCCCTAAGTACAGGATACAGAGC +AAAGTCAATAAATTGAGTGATTATCTCGTCCCTTTCCTGTTTTCAAACTTGAAATCATTG +GTTTCCCACTCCCTCTAGCACTGCCATCGATTGAGTGCCTCTCATATGCCGGACAAGCAA +GGACCGGTGTGCTGGAGTTGCGTTTCCAGCGCATGGTTGCTTGAGCTGTATTTCCAGCGC +ATCGTTGCTCGAGCTCCGTTTCCAGCGCATATCTTTGCTTGTCTGGCATATGAGCTGCGG +TGCAGGGTTTCAAAGCCATAGTTTTCATGGCTTTCCTAATCTGGCCCCGCTGAAAGCACC +CTGGTCCATCAGGCAGGATGCATAGGTGAGCCCTGTGGTGAAGGCCAGGTCTGGTCCCTT +TTCGTAGGCCCCGACGGGTGCAGTGGGCACTTCTTGCCCTCTTCTTCCTGGATGCCATCC +TCTGGACACCCCACCCTCCAGCTGAACCCATCTCCAGCCTTCTCTCTTCCTCCATTATTT +ATTTATTGAGACAGGGTCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGCACAGTCTTGG +CTCACTGCAACCTTCCGGGTTCAAGTGATTCTTCTGCCCTAGCCTCCCAAGTAGTTGGGA +TTACAGGTGCCTGCAACCACTCCCGGCTAATTTTTGTATTTTTAGTAGAGCCAGGGTTTC +ACCATGTTGCCCAGGCTGGTCTCAAACTCCTAACCTCAGGTGATCCGCCCGCCTCGGCCT +CCCAAAAGTGCTGGGGTTACAGGCGTGAGCCACCGCGCCCGGCCAAGCCTTCTCGCTTCC +TTCCAACACCCTTGCTCCTTCCCGCCCCCGACTACTGTCTCAGCGAAGCCGCCCCTGGGT +CCCCTAGCCCAAGGTGCTCTCACCTCTAAATTTAGAGGGGCCTTTACTACGAGCTTTTCG +GTCTTCTGTCAGTGATCTACAAATAAGTGAACTACAAATCAAGCCAATTTCGTTTCTCAG +TGCGTTTCCTAATGTTTCCTCTGTTCTCCTGGGCTTAAGGAGAGGCCATCTCTCTCCTGT +GTCTACGGTGAGCCGGGAAGAATCGGCTCCCTGCACTGGTCTGCCCGGCCTAGGCCCTCC +TCGCCCATCACGCACGTGCTCGGGTCCTGGGAGGCCGCGTCAGTCCGGCCGGGAAGGAGC +AGGACCCAGTCGCCATGGCTGTCCCGGCGTACGCAGGACCGCGGCCTGGGGCGCTCACCT +CGCTCCAGGAGCCCAGAGACCTCGCCGGGCTCGGGCTGAGGTGTTGCCGGGCTCTCGGCG +TCCCAGACCCGGCTCCGGTCTCCAGGCAACCGCGGACGCCGCCAGGCCCACCCTGTGCTC +TTAAAGGGGCCGCGCGCCAGCGCCAAGCAGGTGTCCCGCCCTTGCTGGTCCTGAAGGCCG +GGGGAAAGGCTGGACGCTGGAGGCAGCAGGCCAGGGTTTTCCCAGCTCTGCTAACTGCTT +CATCATAAAATAGGAATAACGCAGGCATTAGTTTTCCATTGCTGCCGCAAACAAATTACC +ATAAATTTAGTGGTTCGAAGCAACACAAATTTATTACCCTACAGTATGTAAATTAGTCCC +ACAGTGCTGGTTCCTTCCAGAGGCTGAGGGAGAGAATGCGTTTTCTTGCCTTTTCCAGCT +TTTCCAGAAGCGGTCCCCAACCTTTTTGGCACCAGAGACCGGTTTCGCGGAACACAATTT +TTCCATGGATTGGGGTCGGGGAGGGATGGTTTCAGGACGATTCAAGTGCATTGCATTTAT +TGTGCACTTTATTTCTACTATTATTACATTGTAACATATAATTAAATAATTCTACAACTC +ACCATCACAGAGACTCAGTGGGAGCCCTGAGCTTGTTTTCCTGCAACTAGACAGCCCCAT +CTGGGGGTGACGGGAGACAGTGACAGATCATCAGGCATCAGATTCTCATAAGGAGCGTGC +AACCTACATCCCTCGTGTGTGCAGTTCACAATAGGGCTCGTGCTGCTATGAGAATCTAAT +GCCCACCGCTGATGTGACAGGAGGCGGAGCTCGGGTGGTAACGCCAGCGACGGGGAGTGG +CTATAAATACAGATGAAGCTTCGCTGGCTTGCCGGCCCCTAACCTGCTGTGCACCCCACT +TCCTAATAGGCCATGGACCACTACTGGTCTGTGTCCGGAGTGTTGGAATCCCTGTTCTAG +AGACTGCTTGCAATCCTTGACTAGTGGTACCTCCTTCCATCTCCAAAACCAGCAAGACAG +CCTCTCTCTGGCCAGCAGGGAAAGGTCTCCACCTTTGAAGGACTCACCCAATGGACTGGG +CCCACCCAGACAATCCAGGATAATCTCTCTGTTGCAAGATCCTTAACTCAGCCAGGCATG +ATGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGTCGGATCACCTGAGGT +CAGGAGTTCGAGACCAGCCTGGTCAACATGGTGAAACCCTGTCTCTACTAAAAATACAAA +AATTAGCCAGTATGGTTCTGGACACCTGTAATCCCAGCTACTCGGGAGGCTGAGGTGGGA +GAATCACTTGAACCTGGGAGGCAGAGGCTGCAGTGAGCTGAGATCATGCTATTGAACTCC +AGCCTGGGCAACAAGAGCGAAACTTCATCTCAAAGAAAAAAAAAAAAAAGATCCTTCACT +CAATCACACCTGCCGAGTCCCTTCTGCCACGTGAGGCAGCGTGGTCACAGGTTCTGGGGA +TTAGGACACAGCTGTCTTGGGGGCTGTTATCCTGCCACAGCTCCCAATCTGGAGAGTTCA +TAAGTGGGATCCTGCAGACCACGCCAGCACAGTGCCAGACACGATGGCACAGTGACTACT +GTACTGCCTCCTCCATCTGAGGGATTCTAAAGCAGGAAGGGGAGCCGCCCACAGTCTGGA +GAAGGGGTGGGGGCAGCAGGGGGAGCCACATCTGTCATCTCTGGGCCCCCAAGAGGGCAT +CTTTACTTCCATTTTCAGCCAAGTTCAAACAGGACAAGGTTCCATGAAAACTATTTGAAA +AGACAGACAGGGATTCTTATATTCCCAGAACCATTCAAGGCCAGTAACTGGAATGTTCTA +CAGTTCACATCCTGAGGAAACCAAATCACAGCATCAAATTATGGGAAATCAAACTCTTTT +TGTTCCCCTGCGAGGACAGCATTTTGCGACCTTGGCCGCACAGAGGAATGTTTCAAATAG +TGACCCCTGTCCCATCCAGTCATTTTCTTCCAGCCGGGCAGAGAATCCCCCGTGTTTAAA +AATTTAATGTGAATCAGGGCTGAGAATCACTAACTGAAAAGGACCCTACTTTTAAATTTA +TGAAATTAAACAAAGATGAATTTAATTATCATTAAGGGTTGAAAGTTATAGACTAAACTA +TGTCCAGCCAGAGCAGAGGCCTGAGTAACTTCCAAAGTGGTTTGGTTTTTTTTTTTTTGT +TTTGTTTTGTTTTGTTTTTTGAGACACAGTCTTGTTCTATCTCACCCAGGCTGGAGCGCA +GTGGCGCAATCTCGGTTCACTGCAACCTCCGTCTCCCGGGTTCAAGCGATTCTCCTGCCT +CAGCCTCCTGGGTAGCGGGGATTACAGGCATGCGCCAGCACACCTGGCTAATTTTGTATT +TTTAGTAGAGGCAGGGTTTCTCCATGTTGGTCAGGCTGGTCTCGAACTTCTGATCTCAGG +TGATCCGCCGGCCTCGGCCTCCCAAAGTGCTGCGATCACAGGCATGAGCCACCATGCCCA +GCCCAAGTGTTCTTATTTTTATAAAATGTGTTCTTGCCTGGACACACACACACGAGCGCA +TGCAAACATAGAGAAAAAAAATTTGCAAGCAATGCTCCATCTGGTTTGAAAAGGTTCTCA +AGATCACTTTTAAATGGGTGTGATGTGTATTTTTTTTAAGTAGCAGGTTCATTTTAAAAC +AAAAAAGGTTAGTGAAGACTCTGTCTTTCAAAACATAAAAATCTGCGATAAAACCAATTA +TTCCATACAGTGACTACGGTCAGTTCTGAGAAATGACACCCAGGTTGGCGATGTGTCTCA +TGGTTGGCCTTCCATGGGGACAGTTCCAGGGGTGGTCCATCTCCCCCATGTGGGTGATCA +GTTTCTTCATCTCGCTTGTGTTAAGAGCAGTCCCAATCATCACCTGAGTGTGAGACACAA +TGGTTCAACGTTTTAGTAGTTTTTTGACGTCAGAATGGCAGCTCTTCAGAAGCATTCTTC +TCTAAAATAAGGCTGGACAAGATTACAGCTCAAAAACTACCTTCCCTGAAAAACCTTCCC +CCAGAGAAGCCTAGGTTCTAGATCTCAGCCCTCCACCCTTCTGTGAAATCAGGCTCCTTG +TGGCTCCTTCAAGGTGGCACCGCCTCCACTCCAGACGCCGACCACACCTGTCTCAGCAGC +CACCCTGCCCTCTCACCCTGGCAGGTGCAGCAGCCTCCCAGCAGGCCTCCCTGCCCCACT +GCGACCCCTCCGAGCCGCTCTCCACTCAGCAGCCAGTGATTACTTTTAAAGGGCTGTCAG +GTTATTCATTCCACTTCACAGCTCTCCCCCTCACCTGAATAAAAGCCCCCGTCTGTCCCC +TGACTTGGCCCTCGCTGGGCTGTGCCTGCACCCCCACCTCCAAGCACGAATGCCTCCCTT +CCTCACCCCAGCTGCACTGCTACTCCCTTCCTCTTGCACAGGCCCATCACGCAAACACCT +GCCTTGGGACTGTGGCACTCCCGGGACCCTCTCCCCCAATGGGTGCAGGCGTCACTCCCC +CTCTGTCGAGCTCCGACCTGCTGCCCATAGCACTCCAGCCCTGGCCCTGCTGCCTCCCTG +CCATGGGTCCTCTGACAGGAAGGAGAGGACACAAGCCTGAAGCCCAATGTCACCTTCTTT +CTTCCTGCAGCACCCTGAGGGCTCGCCATGTGCCAAGCACAGTCAGAAGGCTGGGGTGAC +AGCAGGTTGGAGAAGGACAGACAATCAACAAGTCAACAGAGAACCAAGACAGGTGGCACC +AGGCGAGGCGGCCTGCTCAGGTGTGGGGATGGGGTGAAGGGTGACGGTGGCAAACCCAGG +TAGAGAGGAGAGTAGGGAGAAAGGGTGTAAGGCAGGGAGGAGACTGAGGCGAGCGTGGAA +CTGGAAGGCAGCTACATGGCTGGAAGCTACATGGTGGGGAGATGGGGCTGGAAGGGTGGG +CAGGGCTCAAAGCAGGAGCCTCCTGGGCAGGCAGTGACAACACCGGAGATGGACGGGTAG +GCCAGGGCGAGAGGGAAGGAGCAGCCTGTGGTTCCCCGGGCCACTGAGTCACACTAAACT +CAGGACATCAAAACTGCCCGGCTATGAGCTCAGCTCCACGCTCTCACTCACAGACTCCAA +GACTGGAAGATCCATATTATGTCTTTTATTTTGGTGAGGTCAGGGGTGGTGGAGAGACTC +TGTCTCCCAGGCTGGAATGCAATGGTGCGATCTCAGCTCACTGCAACTCCGCCTCCCAGA +TTCAAGCAATTCTCCCGCTTCAGCCTCCCGAGTAGCTGGGATTACAGGCGCCCACCACCA +TGCCCAGCTAATTTTCGTACTTTTAGTAGGGATGGGGTTTCACCATGTTGGCCAAGCTGG +TCTCAAATTCCTGACCTCAGGTGATCAACCCACCTCCGCCTTCCAAAGTGCTGGGATTAC +AGGTGTGAGCCACCACGCCCAGCCCCTATTAGGTCTTTATCCAAGAAACACTGTGGCTAG +AAGTCAGACTCTGGGCCCTCTTCTAATTAAACTCTGCCCTTGAGTCATTTCATCTAATCT +CATGGCTGTAAATTACACCTGAAGCTCACACAGCAGGCTCCATCCCACCCACTCCCCACG +TGGCCCCCAGCTGCTGCTCTCCTCAGCGGCCGCAGCCACCGCACCCCTTCCAGTCTGTTC +TCTCTCCAGCAGCTGCAATCACGGGACTCCTTCCCGTCTGTTCTCTCCAGTGGCTCGTGC +CACACACAGCACAGACCCCCAGGGTCTAGGTATGACCGGCAACACTCTACGTGGCTGTCC +TCTGGACGCCGCTCTGCTCACTCCCTTCCCCTCTCCAGGGACACAATCAGCCTCTGGCTT +CAGTCTTGCTACTTCCTTCGCTTGGAAAGTTCTTACCCAAGAGGGCTCCATTCTACCTTT +TTTTTTTTTTTTTTTGAGACAAGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTTGCGT +GATGTTGGCTCATTGTAACCTCGACCTCCCTGGCTCAAGTGATCCTCCCACCTCAGCCTC +CTGAGTAGCTGTGACTACAGGCACATGCCACCACACCTGGCTAATCTTTTAATTTTTTGT +ACACATGGGGTCTGCCTGTGTTGCCCAGGCTGGTCTCTTAACTCCTGGCCTCAAGCAATC +CTCCTGCCTTGGCCTCCCAAAATGCTGGGATTACACGTGTGAGCCACCATGCCTGGCTTC +CATCCCACCTTTTAGATGGCAGCTGAGATGCCACCTGCCCAGATGCCATTCCCTGACCAC +CATCTCACCTGGTCACCATGTTTTTCTCTTGTCATTTCCTGCCCCAAAACGCTGTTTTAG +GCCAGGTGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGACCAAGGCGGGCAGAT +CATGAGGTCAGGAGATCAACACCAGCCTGACCAACATGGTGAAACCCCATCTCTATTAAA +AATATAAAAATTAGCCAGGTGTGGTGGGTGCCTGTAGTCCCAGCTACTTGGGAGGCTGAG +GCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCAGTGAGCTGAGATCACATCACTG +CACTCCAGCCTAGTAACAGAGCGAGACTCCGTCTCAAAAACAGACAAAGAAAAATGCTGT +TTGAATCTCTTGACTGTGCTTACTGGCATCTAATGCGTGTCATTTATTTGTGGTGATGCC +TATTTCTCCCCACTGTCTGCTCCACAGGGGCAGGGGCTGCAGCCGCCTTGTTACCTCTGT +GTCCCGAGCACCTGGAGCAGGGCGGGCCCCACATCAGGGGCTCAAGGAGCACCTGCTGAA +TAAATAAAGGAATGGCGTCCTGGCCCTTCCCAGTGGCCAGCTGATACACAGTCACTTTTC +TTGGACATCAGGCTAATCCCCACTGCAGGCAGAACCACTGCTGCCACCTTCCCACACCAA +CCGAAGCAGCGGCAGTGACGCCACGTGCAATGACAACCACGGCACCCCGTGAAGCACCTG +CTGCCTCGATGACTCTGCAGAATCGTGTCCAATGTCGCCGAGTCCTGGCAGCAGCAAATC +TTTATCTCCCAATGTTGTTATGACCCATAAGGTCCATAGACGAACAAGGTACCTCAAACG +CTAACTGCGTTGGAGTCAACCAAAGCTCGGAGATAGAATACTGGCCGGGCCAGGCACAGT +GGCTCATGCCTGTAATTCCAGCACTTTGGGAGGCTGAGACAAGGGGCAAAAGGAGACCAT +GTTTCTACAAAAAATTTAAAAATTAGCTGGGCATGGTGGTGCATGCCTGTGGTCACAACT +ACTTGGGAGACAGAGAGAGGAGGATCGCTTCAGCCTGGTACGTCAAGGCTGCAGTGAGCT +GTGATTGTGCCACTGCACTCCAGCCTGGGGGACAGAGGGAGAATCTGTCTAAAAAAAAAA +AAAAGAAGAATTCTGGGTTTTTTTTGTTTTTTTGAGACGGAGTCTCGCTCTGTCGCCCAG +GTTGGAGTGCAGTGGTATGAACTTGGCTCACTGCAAGTTCCGCCTTCTGGGTTCACGCCA +TTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGACTATAGGCGCCCGACACCACGCCCGGCT +AATTTTTTTGTATTTTTAGTAGAGACGGGCTTTCACCATGTTAGCCAGGATGGTCTCGAT +CTCCTGAACTCGTGATCCGCCCGCCTCAGCTTCCCAAAGTGCTGGGATTAGAGGCTTGAG +CCACCATGCCCGGCCAAGAATACTGCTTAACAGAGGTAACAAAAGAGCAATAATTATGAG +TTCAAGGTCACAGAGAACGCAGACGACACAGATGCTCAGCTACGACGCTGCACGTAGCTC +TCTGTGTAAAATGACCCCTGGCAATCACAAAGGCGTTTACAACCTTGACCAAATCAGGAG +CTGGGCTGAGACCTTCCTCGACTGCAAGCTTGAGCAGCTGAGCTGACAGCCAGGCTTTCT +TTACTTACCGACTTCCGGCAGGCTCTGGAGGCAAACATCTGCTTGACTCGGGAAGGCCGG +CACATGACCCCAGGGCTGTCGCTCAGCATGAAGATCAGTTCATCGACGTCCTGGGGTCCG +AAGGTCCAGTTTTTACTAGTTGGCAAGGAAATCAGTTTAGCCCTTTCAGTGACTGGAGCT +AAAAGAATACAATTTTGAGAAAAATCCATGACTTGACAAACACGTTTCACTTGAAAGCTA +CTTAGGATGAACATCTGAGGCCGGGCGTGGTGGCTCACGCCTGTAATCCCTGCACTTTGG +GAGGCTGAGGCCAGCGGATCATGAGGTCAGGAGATACAGACCATCCTGGCTAACATGGTG +AAACCCCGTCTCTACTAAAAAATAGAAAAAATTAGCTGGGTGTGGTGGCAGGCACCTGTA +GTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGTGTGAACCTGGGAGGCGGAGCTTG +CAGTGAGCCGAGATCGGCACCACTGCGCTCCAGCCTGGGCGACAGAGCAAGACTCCATCT +CAGAAAAAAAAAAAGTGAACACCTGAAAGAGAGGAAACTCACAAAATGCTTTTTGGAGGA +ACTTTTTAATCTTTTATAAAATTAAAAAAAACTGGTCTATATGACCTGAAAGATTATTCC +CAGCTCTAAAAAGACAAGAATCTATAGTTCTGATTTTTTTTTTTTTTTGAGACAGAGTTT +CACTCTTGTTGCCCAGGCTGGAGTGCAGTGACGTGATCTCGGCTCACTGCAACCTCCACC +TCCCGGGTTCAAGCGATTCTCCCACCTCAGCCTCCTGAGTAGCTGGGATTACAGGCACCC +GCCACCACGCCCGGCTACTTTTTGTATTTTCAGTAGAGATGGGGTTTCACCATGTTAGCC +AGGCTGGTCTCAAACTCCTGACCTCAGGCGATCTGCCCGCCTTGGCCTCCCAGAGTGCTG +GGATTACAGACGTGAGCCACCACACCCAGCCGCTATAGTTCTAATTAATAACTTACCATT +TTCATCGATAACAAAATCAAAGCCATTCTTTCTAAATATTTCCAGATTTTCTATCAGAAC +AGCTTCATTAACAGCAGTTAAGTTGAGAGTCTGAGGTCTGAAAAACACAAAAATGATTCA +AACCATATCCTGAAGTCAAACATTTAGCTTTACAGCAGAAATGAAATGAAAACAACAATA +CTGTATTTTGAATTCATGTCAAAATAACAACACAAATAACAACACTACTCAGCTAAGTGT +CACAAAACTTCCTGAGAAGTTCCTTTTAATTTTCTCTTTCTTAAAGTTCTTTTTAGAAGT +TAAAGTAGCTACAGGCCAGGTGCGGTGGCTCACGCCTGTAATCTCAGCACTTTAGGAGCC +CGAGGCAGGCAGATCTCTTGAGGCCAGGAGTTTGAGACCGGCCTGGTCAACACAGCGAAA +CACTCTCTCTACTAAAAATATAAAAATTAGGCCAGGCATGGTGGCGCACGCCTGTAGTCC +CAGCTACTTGGGAGGCTTAGGCATGAGATTCGTTTGAACCCAGGAGGGAGGCAGAGGTTG +TAGTGAGAGCCAAGATCACGCCACTGTACTCCAGCCTGGGCGACACAACAAGACTCTGTC +TCAAAAAAAAAAAAAAAAAAAAAACACCCATAAAAACAAAAATTAGCTGGAAGTGGTGGC +TCATGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCACTAGAATTGCTTGAACCCAGGA +GGTGGAGGTTGCAGTGAGCCAAGATCACACCACTGCACTCCAGCCTGGGCAACAGGGCAA +GACTCTGTCTCAAAAAAAAAAAAAAAGTTCAAGTAGCTACAAAAGTAGTTTGCTTTTTCC +TCAGCCTGCCACGCCAATGACTCCCACTTTTTCTGAATCCTTTCCTTAAGGATAACAGTA +TCACAAAAATGCTATTTTTCCTCCTTCTAATACAGAATTTGAAACACTGGGTTAGGTCAT +TGCCAGCATTTGTAAACAGAATGAACAGACAGCTTTTATTTTGCTATCCTGTTCCTTCCT +CTGCCTGTATTATATCTCCATCCCTCTCTCCTCCTGGATTTACTGTTTGTTTTTTTTTAA +CCTTTCGTTATTTTTTTCAAAGATAGAGACAGGGTCTCACTATGTTGCCCAGGCTGCTCT +CAAACTCCTGGGCTCAAGCGATCCTTCCACTTCAGCCTCCCAAAGTGCTGGGATTACGAG +TGTGAGCCACTGCATCTGGTCCTGAGTGCTGGATAAGACAAACACTGCTCAAGGCAGGAG +ACAGCTGGTGAGCAAACACAGGCTTGGTCCTGGAGCCAACAGATTACCGGGGAAGAAAGA +CGTTGAGCAAATACTCAGGCAAGTCGATTATGATGAGAAACGACAGGAAGGTCAGGAAGA +AAAAGCAGCCAGTGTCATAGAGAGACTTCACCCTGGGGTCAGGAAGTGACCTTTGAGCTG +AGTCCGGGGATAAGAGAGTTAATCAGGTAACGGGGGAGAAGTGGGTGCAGGGTGCAGGAC +AAGTATTCTAGACAGGGACAACAATCTGTGCCAAGCCCCAGGATGGACCGCTGATGTTTG +CAGAGCCACACATAAAGATATCCTTCATTCTGCTTAGTGGCCACATAGGGATTCATCAGG +CCTGCCAAGGGAAAAAGAAAGACAGCCAGAGAGGCTTGAGTACAGGGAACAAGGGGAAGA +CGAACGGGAAAAGCTACAGAGGTCAACAGGGCCACCCTACACAGGGGCTGGCAGGGCAGG +GTGGAACTGGGTCTTTATCCTTTAATCTTGAAGTGTGGTCCATCTGGGACCCTAAGTGGT +CTGTGATTACCTGGGCCAACTTGAAATGTCACAGATGAGAGGTTATCTTTGCCGAATGGC +TAAAAAATACAAGACCTCAGCCGGGCATGGTGGCTCACACCTGTAATCCCAGCACTTTGG +GAGGCTGAGGTTGGTGGATCACCTGAGGTCAGGAGTTCAAGACCAGCCTGACAAACATGG +CAAAACTCCCTATCTATTAAAAATCCAAAAATTAGCCAGGTGTGGTGGCGGGTGCCTGTA +ATCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATCACTTGAACCCGAGAGGCAGAGGTTG +CAGTAAGCCGAGATCACATCACTGCACTCCAGTATGGGCGAAAGAGTGAAACTCTGTCTC +AAAAACACAAAAACAAAAAACCTCTATTAAGAGGAACAGGGAAGGGATATAAAGTAGCTT +ACTAAATGTCTATTATTACCATTGCCTCCTACTGAGAATAAAAACAATTCACGCATTCCA +CAGGAGAGTACTCAGCAAACTACACAGGAGAGTACTCAGCAAACTACACAGGAGAGTACT +CAGTAAACTACACAGGAGAGTACTCAGCAAACTACACAGGTTCAGTGGTACATTTCTCCA +TGTGGGATCTACTTGTTGGGATCTGAGTTTACTTCACTACGTGGTTTAATTTCCCACACG +AAAATCCATGACCTCTTCTTCTAACTTTGCTGAAGACAAGACTTTGGTTTTACATGATAC +TATCACACCTGACCTTTGTGAAGTAGTCAGGGTAAAACATTCCAGTTTGGCCGAGGAGAG +AGAAATACCAAATTCTGCAGTGACTATCTTAAAATAATTTTTAAATTTTATTTTATTTTA +TTTATTAATTTATTTGTGAGACAGAGTCTCACTGTCTCACTCTGTCACCCAGGCTGGAGA +GCTGTGCAGTGGCACGATCATGGCAGCCTCAATCTCCTGGGCTCAAACGATCCTCCCACC +TCAGCCTCCCGAATAGCTGGGACCACAGGCACACACCATCAAGTCTGACTAATTTTTTAC +ATTTGTTGTAGAGACAAGGTTTCACCATGATGCCCAGGCTGGTCTCAAACTCCTAAGCTC +GAGGGATCTGCCTGCCTCAGCCTCCCAAAGCTCTGGGATTACAGGCGTGTGCCCCTGCAT +CCAACCTGCAGTGACTATCTGACTTCTGATTACTCTACTGTCAATCAACACTGGCGCACA +GGCTGTCTGTCTTTCTGAACACACACATTCCATACACTATGCATACTAATACTCCATACT +ATCAATTGCCCTCATCAGAAGGATCTTCTGGCTAACCAGTGATCAACATTTTTAATAGCG +AAAAATACCTGATACTTAGAGAACATGTTAACCACGTGAACTGGGGCAGGTTACTCAACC +TCTCTGCATGTGCCTCAGTTTTATCGCTTGTGGAATGGTGATGGTAACAGTAACAACCCC +ATAGGTTTTTGAGGATTAAAGGAACTAATACACATACATTATTTCAACAGTGCCTGGCAG +ATTCTAGGCACTGAATAAATGGTAACTATCACTATTATGTAAAAAGTATAAAAATCTGCT +ATATGAATACTTATGGAAAAATACATATATACATATAGACACACATATAAACTATTAGGT +CTCTTTTTTTTTTTGAGATAGAATCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGCG +ATCTCGGCTCACTGCAACCTCTGTCTCCCAGGTTCAAGCGATTCTCCTACCTCAGTCTCC +TGAGTAGCTGGAATTACAGGCGTGCACTGCCATGCCCAGCTAATTTTTTGTATTTTTATT +TTTTATCATTATTATTATTTTTTGAGACGGAGTTTCACTCTTGTTGCCCAGGCTGGAGTG +CGATGGCACGAACTCGGCTCGCTGCAAACTCCGCCTCCCGGGTTCAAGCGATTCTCCTGC +CTCAGCCTCCCAAGTAGCTGGGACTACAGGCGCCCGCCACCACGCCTGGCTAATTTTGTA +TTTTTAGTAGAGACAGGTCTCACCATGTTGGTCAGGCTGGTCTCGAACTCCCGACCTGAA +GTGATCTGCCCACCTCGGCCTCCCAAAGTGCCGGGATTATAGGCGTGAGCCACCGTGCCT +GGCCTTTTTGTATTTTTAGTAGAGGCGGGGTTTCACCACGTTGGCCAGGCTGGTCTCCAA +CTCCTGACCTCAGGTGATCTGCCTGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGTGTG +AGGCACCGCGCCTGGCCAACTAGATATTTTTTATTTTTTACACCCCTCCTTCCTAGATCT +CTTCTTTTTTAAAGTAGATACAAGGTCTTGCTGTGTTGTCCGGGCTGGTCTCAAACTCCT +GGCCTCTTGTGATCCTCCTGCCTTGGCCTCTATTAGATCTTCAATTTGAGGGGGAGTCTG +GGAATGAACACTAAACACACTCACGCTATGAGCCTCTGCCCCTGGAGCACGGTGTGCTGC +TGCAGCATCTCGAAGTTATACTTCTCGTCCGTGGCATGCTGGTCCACTATGAAGATATCC +TCATTCAGTTTGGTTATTATAAATCCCAGGTTAAACTGACCAATGATTTCCATTTCTGCA +AACATCGTTTTACTGCAGGTAGAAAATGTTAATTATCAGACATTTTACAAGATTATTTTT +CTGATTATGTTATAGAACACTGTAATAAAAAAAAAGTCAAACAATACAAAAACAAAATAA +AGTCCCTAGCCATCCCGCTTTCTTTTTTTTTGAAACAGAGTCTCGTTCTGTCACCCAGGC +TACAGTGCAATGGCACAATCTTGGCTCACTGCAACCTCCACCTCCCGGGTTCGAGTGATT +CTTCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGTGCGCCACCATGCCCAGCTAATT +TTTGTATTTTTAGTAGAGACAGAGTTCCACCATGTTGGTCAGGCTGGTCTCGAACTCCTG +ACCTCATGATCTGCCCGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACTG +CGTTCGGCTTAACCATCCCACTTTCTAAAGATAACATTAATTATTCATTCATCCAACTCT +CCGGAGAAGACATCAGTTGCTACTATTAACGATTTAAATGGAATATATCCTTCTAGACCC +TTGTCTCCATATATAATTTTTTTTAATTTTAAAAAACAAAAATGGAATCTTAATTCTCCA +TTCTGTCATCACTTAATGCATCTGAAACAAGTTTTCAGACCTGTACACATAGATCTACTT +CATTATTTTTTCTTTTTTTTTTTCTTTTAAGACGGAGTCTCACTCTCTGTTGCCCAGGCT +GGACTGCAGTGGCGTGACCGTGGCTCACTGCAACCTGCGCCTCCCAGGTTCGAGCGATTC +TCCTGCCTCAGCCTCCCGAGTAGCTGGGACTACAGGCATGCACCGCCAAGCCCGGCTAAT +TTTTTTATTTTTAGTAGAGACAAGGTTTCACCATGTTGGCTAGGCTGGTCTTGAACTCCC +GACCTCAAGTGATCCACCTGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCA +CCGCACCTGGCCTACTTCATTCTTTTTAATGGCCACATAGGAATTCATTGCATGGATGTA +CCATAATTTGTCTGACAAATCCCCTACTAAAGGACATTTCAGTTGTTTCCAATTTCAATA +GCGCACTCAAAGCTGCAACAAATACTTCTGTGCATAAACCTACTCATCTGTGGGTGCATT +TCCGTGAGACAGACGCTAGAGGGAGAACTACATATGTACTTCTTGACGGGAAATCTGTGA +AAAGTCACACTCCCACCAATGGTGTGTAAGAGCACCTTTCTGCCAATGCTGGATATCAAT +CCTTCTCATCTTTGCCAGGCCCACCACTGGGTCCTTTGCGGGTGGCTTCAACATCTAATG +TCATTAAATACTAACTTAGTCAATCTGGACAAAAGACAGACACCACCGCTAACCTTCACA +CGAGAAATTGACACTGTCATTCTCAGTCCCACACAATTAAATCCGGTGAAAATGGATTTT +CCGCAGTATCAGCGCGGTGATGACAAGAAATGGCTCTGTTAAAGCAGCCATGGACGTTTT +CTGGTTCTCACCTGGTGGCCTGAGCTGAGGATGAAAGCAGCTGTAATGTAATCCCAGCAC +TTTGGGAAGACAAGGTGGGCAGATCATTTGAGGTTGGGAGTTCAAGACCAGCCTGGCCAA +CATGGTGAAACCCCATCTCTACTAAAAATAAAAAAATTAGCCAGGCATGGTGGTGGACAC +CTGTACTCCCAGCTACTTGGGAAACGAAGGCAGAAGAATCGTTTGAACCCGGGAGGCAGA +GCTTGCAGTGAGCTGAGATCGTGCCAGTGCACTCCAGCCTGGGCGAAAGAGTGAGACTCT +TGTCTCAAAAAAAAAACAAAGGAGCTGATATTGTTGTTTCTTTCTATAAGTGCTCCAGGA +AGACCCGGTCCCATGCCACCATGCTCGTCACCATCACAATCAACCACAGGGGACAGTTTG +GTGAACTGTGAGACCTCCACATGGCATGGATTACTGAGCCCACATTTCCTATGGTGAGGG +GCTCCACACAGAGCTCAAATCCAAGTCATAACCAAACCAGTCCCCAAATCCTATCTTTGA +GGGTCTGTTTCCTGGTACCAATTCCAGATCAGGCAGAGTGCAATCAATCAAGAGACAAAA +ACCACACCAGTGATTTTAACAGGGACTTTTTTTTTTAAGACAGGGTCTTGCTCTGTCACC +CAGGCTGGAGTGCAATGGCATGATCATAGCTCACTGCAGCCTCAAACTCCTGGGCTCAAG +TGAGCCTCCTGCCTCAGCCCCCTGAGTACCTGGGACTACAGGCGTACAGCAATGTACTTA +GCTAATTTTTTTTTTTTTTTTTTTTTTTTAGAGATGGGGCCTCATTATATTGCCCAGGCT +GGTCTCAAACTCCTAGCCTCAAGTGATTCTCCTGCCTCAGCCTCCCAAAGTGCTGGAATT +ACAAGGTGTGCACCACCATGTTAGGCCTGAGGAGGAAAAATGTATAATAAGGCATTACAC +AAACTAGTAAAAGGTGGTTAACTACTATGCTAAGAAATACAGGAATGGAAAATGCTACTA +TCCTAGGGAAGAGGGAGAGTCCTCAGAAAAGGAACTCTTTTTTTCTTTTTTCTTTTTCTT +TTTTTTTTTTTTGAGATGGAGTTCGCTCTTGTTGCCCAGGCTGGAGTGCAATGGTGCAAT +CTCGGCTCACCACAACCTCCACCTCCCGGGTTCAAGCAATTCTCCTGCCTCAGCCTCCCA +AGTAGCTGGGATTACAGGCATGCACCACCATATCCCACTAATTTTGCATTTTTAGTAGAG +AAAAGGTTTCTCCATGTTGGTCAGCCTGGTCTCGAACTCCCAACCTCAGGTGATCCACCC +ACCTCAGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACCATGCCCAGCAGAAAAGG +AACTCTTGTAAGAGGCTCCTACCCACTCAGGCTGAGTTTCAGACCTCCTTGGAGCAGGAG +TGGCCGCAGCCTGCTGGATGGAGAGAAGCTGCCAGAGTGAGTGATGACACAGGAACTCCT +GCCGCACAGGAGGGAAGGAAAAGAACATCCCAGAAGCATCCCAGATGCCAGCACAAATAC +CACCTCCCCTGGCGCCGATCCCAGGCTCTCCCAGGAATTGTCTGAATATGCCCTGGTTCC +CAGTACATAGATAATCTGCTCAAAAGCTGGTGCTGGCCTAAAAGACCCAAGTCTTCCATG +TGTTTGGAGTCTGTGTCCTGCCACAGAGAACAGGATCTGGCCAGGCGCAGATGCCGGAAT +TACAACTGCGCACTACCGCGCCCAGCCAATTTTATTGTAGAGACGAGGTCTCCCTATGTT +GTCCAGGCTGGTCTTGAACTCCTGGGCTCAAGTGATCCTCCCTCCTTGGCTTGGCCTCCC +AAAGTACTGGGATTACAGGTGTGAGCCACCACACCTAGCCTCAAAATACTCTTAAGAAAA +AACTTTACCTGGCCGGGTGTGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCAA +GGTGGCTGGATCACCTGAAGTCAGGAGTTCGAGACCAGCCCAGCCAACATGGTGAAACCC +TGTTTCCACCAAAAATATAAAAATTAGCCAGGCATGGTGGCGTGCACCTGTAATCCCAGC +TACTCAGGAGGCTGAGGCAGGAGAAACGCTTGAACCCGGGAGGTGGAGGCTGCAGTGAGC +CAAGATCATGCCACTGCATTCCAGCCTGCGCAACAGAGCAAGACTCTGTCTCAAAAAAAT +AAAAAATAAAAATAAAAATTTTAGATAAAAAGAGAAAAAGTAAAAAATTAAAACTTTACC +TTATCTCTTTTCTTAGTTCATCTTCGGCTGCTTGATTTTCTCCAGGACAAATCTTTGCCC +TAAACTTCCTGTAATTCTGTTCCCCTTCACTTTGCTGTGCTTCATGATGTAACTGCTTTA +TTCGTTTAGCTAAAGAACTCATAGAAAAGTCCAGGGGCACAACTTTCTTATTAATTTTCA +CAGCTACATCAACCTGAGAGGCTGACATGTCCTGAGTATTTACTAACTTTTGACAAATGT +CAGAACTGGAAAGAATTTCTTCTTTTTTAAAACGCTTTGTGTTTGGGGTTGCGAGATTAG +TTGGCTGAGGCAAAACTCGAAATTTACATCCGGTATCTTCCTGGTTTGAATGGCAGTCCA +CATCTGAAAAAGAGTCGTCAGTTTTAGGCGCTTTCTCCTGAGAGTCCACATGTTCCTGCG +AGCCCCTGTCCCCTGGGGAGCTGGCCGCATACTCGCTGCTGCAGTGACTGCCCGTGTCTG +GGATGCTGAACCCCTCAGAATCCACGGAAGTGCTGCCGTGCCCCGAGTCCTTCTCCACCT +CCGCTCTGTCCGTAGGGTCACTGGGTCCGTGACTGGAACTCACTGCCTCTTTCTGAGGTC +TCAGGACGCCTTTGTCAGAGATGGCACCTGAAGTGCTAGAAGACAGCATACCCCTTTTCT +GTCCTAGAGGGCTCCTTCTTGGTTCTGGAGTCTTTGGGCTGTGAGGCTTGTTCTCTGTTG +TGTGACGAAGAGAAAAGGCCTCTCGCAGTCTGGAAATGGACACGTCTTTTTTTTCTTCTC +CAGTCCTTAATGAAGGGGATTGATCCTGCTTTTCTACCATGGGCTTTTCCAAATCCGCTG +CATGCATTTTTATTAAGTTACCTAAGCAAACGTGGACGGAGAAGAGGGTCAGGGACTATC +CTGAAATGGTGAGAGGACGTGCTTATGTGAACAGATACTTCACAAAAGAGGAGATCCACA +TGCTAATTACACAGATGAACACAGTTCAATGTTCAAAATAAAACTATAATATGGGCCAGG +TGTGGTGGCTTACGCCTGTTATCCCAGCACTTTAGGAGGCCAAGGCAGGGGGATCACATG +AGGCTAGGAGTTCAGGACTGGTCTGGACAACATGGTAAAACCCTGTTTCTACTAAAAATA +CAAAAATTAGCCGGGTGTGGTGGCATATCTGTCATCCCAGCTACTTGGGAGGCTGAGGCA +CGAGAATCCCTTTAGCCCGGGAGGCAGAGGTTGCAGTGAGCCAAGATGCCACCACTGCTC +TCCAGCCTGGGTGACAGAGCAACACTCTGTCTCAAAAAAAAAAAAAAAAAAAAAAAAAAC +CACAACACAATGCAATATGGCCATATACTCACCAGAATGGTAAAATTAAAAAAACAACAA +ATGCTCACAAAGATCAGGATCAAGAGGAATGCCTGAATACCTCTGGTAGGAATGAACCTG +GTACAGCTGCTTTGAAAAGTTCTCTGGGAATACCTCCTAAATCTGAATGTATGCACACCT +GCAACCCAGCATAGCTACTCCTATCAGAAGTGCCTATTGGCCGGCACAGTGGCTCACGCC +TGTAATCCTAGCCCTTTGAGGTCAGGAGTTCAAGACCAGCCTGACCAACATGGTGAAACC +TCATCTCTACTAAAAATACAAAAAAAAAATTAGCAGGGCATAGTGGAATGCACTTATAAT +CCCAGCTACTAGGGAGAATGAGAATGAGGCAGGAGAATCACTTGAACCTGGAAGGCAGGG +TTGCAGCGAGCCAAGATCACTCCACTGCACTCCAGCCTGGGCGACAGAGTGAGACTCCCT +CTCAAAAAAAAGAAAGAAGTGCCTATCTATGCTCGTCAAAAAGACGTGGATGAGGATGTT +CATGACAGCATTCTTCATTATAGCCCCAAACTGGAAACAATTCAAATATTCACAAATGAT +GATATCTGACTATAATGGAACACTGTATAGCGAACGAATAAATGAATTTTGCCACATGAC +TTGGGTGAATCTCACAAACAAAATAATGAGAGAAAGAAACAAATCACAGAAAAGGACAGA +CTGAATAACTTCAAATTAAAAACAGATTAAACTATACCGTTTTGGGTTTTTTTTGTTTGT +TTGTCTGTTTTTTTGAGACGGAGTCTCGCTTTGTCACCCAGGCTGGAGTGCAGTGGCACA +ATCTTGGCTCACTGCAAGCCCCTCCTCCCGGGTTCACGCCATTCTCCTGAGTCAGCCTCC +TGAGTAGCTGGGACTACAGGCGCCCGCCACCACGCCCGGCTAATTTTTTGTATTTTTAGT +AGAGACAGAGTTTCACCGTGTTAGATAGTCTCGATCTCCTGACCTCGTGAGCCGCCCGCC +TTGGCCTCCCAAAGTACTGGGATTACAAGCATGAGCCGCTGCGCCTGGCCTAAATTCTAC +TGTTAGAAGTCAGGAAATCCCAGCATTTTCAGAGGCCAAGGCTAGAGGACTGCTTGAGCT +CAAGAGTTTGAGACCAGCCTGGGCATCATGGAGAAACCCCATCTCTAATGACAATACAAA +CATTAGCCAGGTGTGGTGGTGGGCGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGG +AGAATCTCTTGAACGTGGGAGGCTTCAAGGTTGCAGTGAGCTGAGATCGCATCATTGCAC +TCCAGCCTGGGTGACAAGAGCGAAACTCCATCTCAAAAAAACAGACATGACAAGGGAGTT +AAAAATGCAGTCACTGCAGACTTCTTCTAATCATATATCTTATATGACTTCATCCGTTTA +CAGTTTACAAAAAACTAGAGGTACTTGGAGGCAGCTACTTGGGAGGCTGAGGCAGGAAGA +TGGCCTGAGCCCAGGAGTGTGATGCTGCAGTGAGCTACAATGGCACCACTGCAGTCCAGC +CTGGGTGACAGAGCAAGTCCCTGTCTCAAAAAAGAATTAAAAATGATAAAATAATATAAG +AGACTTTGTTTTCATGTCAAAAAAAAGTTTACTTGGAAAAAATAAGGAAACACATTAGCT +AAAAGCTTTAGAAGCTGTTTGTACACTGTATTTTTCTTACCTTCAACATCCAGCAGTGGC +TGCTGACTGACATTTAGCTTGTTGACATCACTATCAAACATTCCTATCAAAGAGGTCTTT +AAAACTGCCAACAAAAGCTTTTCCTCTTGTAGCAAAATTTGCCTTTTATCTGGAGTAACA +TTGATATCAACGCATTCTAAGGCAAAAAAGAAAACATATTTATTATGTTTAAATTCACTT +TTATTTTATTTATTAATTATTATTTTCAGACAGCGTCTCACTCTGTCGCCTAGGCTGGAG +TGCAGTGGCGCGATCTCAGCTCACTGCAACCTCCGCCTCCTGGGTTCAAGTGATTCTCCC +TGCCTCAGCCTCCGAAGTAGCTAGGATTACAGGCAAGTGCCACCACACTGGCTAATTTTT +GTATTTTTAGTAGAGATGGGGTTTCACCGTGTTGGCCAGGCTGGTCTCGAACTCACAACC +TCAAGTGATCCACCCGCCTTGGCCTCCCAAAGTTCTGGGATTACAGGCGTGAGCCACCGC +GCCCAGCCAAATTCACTTTTAACAATAGAAATTTCCCCATCTATTATTTCATTCACTTGT +ATTTATCACAAGTGCTATTAAAAACATTACAGTGTCCAGGTTAAGATTCATAAGTTATGA +AATCAGCTTTTTCAAATAAATGAGCAAAAGACAATTTTTGAATAGACAAAATACGGAAGG +GCTTAATTAGGTAAATTGTTAAAGGAAAAGCAAATAAACACATAAAAATAATTTTAAATA +TGCAAACTAAAATAAGATATTTTAATCCCCTACTGAATTTAGCTTAACAATTATAATACC +TAGTACATTATAGGTAGGTGTGTAAATTGGTACATCTAGAACACAATACAGAAAAAGCCT +TAAAATGATCATATTCACTGACCCAGTAATTCTACTCCCGGCAATTTATATTCAGAATAA +TTAAAGATGTAGGCTGAGTGCAGTGGCTCACACCCTGTAATCCCAGCACTTTGGGAGGCT +GAGACGAACAGATAAGTTAAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGCGAAAC +CCCGTCTCTACTAAAAACACAAAAAATTAGTCAGGCATGGTGGCAGGTGCCTGTAATCCG +TGCTACTCAGGAGGCTGAGGCGGGAGAATCGCTTGAACTCAGGAATCGGAGGTTACAGTG +AGCTGATATTACACCACTGCACTCCAGCTTGGGAGACAGAGCAAGACTCTGTCTCAAAAA +ATATCTAATAATAAAGATGCAGATAATGATTTAATTATAAGGAAAGTATTTATAATTTCC +AAAAACTAAAAACAATTTAATTTTGAAAAATTTAAAAATTAAAATACCAAACTATAACCA +TGCATTGGAATATAATTCACCTATTAAAACCACATTTCTGATCAATTTCTAATAACATGG +AAAAGAAAACATTCACATCTAAGGATAAAGAGCAGTATACAAAATTATTTTCTCATCCCA +AAGAATATGGGAGTAGGGGAGAGAGAGAGAAAGAGAGAGAGGACAGAAGATATTTTTTAA +GGTATGTACATATGTGTTTCTAAGTATCTAGAAAAAATACTCAATTACAATAAACCAAAA +TTTTAACAATCAGAAAAAAAAATCTATATGAAATGAATTATTTATGAAATTAGGAAGAAC +ATTTCATCTACTTTCTCCCTTGGTTGACATTAAAAAAAATTACATTTTCCTAACAATATA +ATTAACATAGTCTCAAGTAGAAAGCGGGAACTCTGTTTAAAAAAAAAAAAAATTATAGGG +CCAGGCACGGTGGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCCAAGACGGGCAGATC +ACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTGAAACCCTGTCTCTACTAAAA +ATACAAAAAATTAGCCAGGTGTGGTGGCACGCACCTGTAGTCCCAGCTACTTGGGAGGCT +GAGTCAGGAGAATCGCTTGAACCCGGGAGGCAGAGGTTGCAGTGAGCCGAGATCACGCCA +CCACACTCCAGCCTGGGTGACAGAGCAAGACCCCGTCTCAAAAAAAAACAAAAACAAAAA +ACTTACATGACCATAAATTGTTATCTCATTCCAGTCATAGCAGAGCTGTAGAATTTCATT +TTATTCTTTGAGGCATTAGTCACTAGTTGTACTGAAATGCCAATGGAACTTACCTGAATC +AACAGAAATGTTAAGAACAACAAATGGATACTGGTGTCGATTATACATGTGGTAGACCTC +ATTCACGAGTCTGCAGACCTGCACAAAATACAAGGAGTAGAAAAGAATAAATGACAAATG +TTCCCAGCCCCCCGCATTCTAACAACATTCTATTCTAACCAACCAGCATGTTCTTAGAAG +GGGATACTTTTTTGTTTTTTTTTTTTTTGAGTCAAGGTCTCGCCTTGTCACAGCCTGGAG +TGCAGTGGAGCAATCATGGCTCACTGCAGCCTCAACCTCCCAGGCTCAAGTGATCCTCCT +GTGTCAGCCTGACATGTAACTTGGATTACAGGCAGGATTTTTTTTTCTTTTTTTTTTTCA +ACGGAGTCTCGCTCTTGTTACCCAGACTGGAGTGTAATGGCACGATCTTGGCTCACTGCA +ACCTCTGCCTCCGGGGCTCAAGTGATTATCCTGACTCAGCCTCCAGAGTAGCTGGGATTA +CAGGCACACGCCACCATGACCAGATAATTTTTGTGTTTTTAGTAGAGATGGGGTTTCACC +ATGTTGGCCAGGCTGGTCTCGAACTCCTGACCTCAGTTGATCCGCCCGCCTCAACCTCCC +AAAGTGCTGGGATTATAGGCGTAAGCCACTACACCTGGCCTAAGGATACATTTTTTTAAC +AGCTTTACTGAGATATGACTAACATGGAATAAACTACACATATTTAAAGTGTGCAATTTC +ATAAGTTTTGACATATACACAAACACCTGTGAAACTATCCCCACAATCAAGATAATGAAT +ATATCCATCACCAAAAGTTTCCTCACAATCTCAAAGTGATATTTCTCTAATCATAGATTC +CTAAAACTGAATATTTTTCCAACTTAAAGTTGCTCTATGAGAAATTCTAGTGAAATGCAA +GTGCAGCTTAAATGTTCATAAAACATATTCAATGTACATAGAAAAGTATCTATGACATTA +AAATGTCATTAGAAATAAACCAAAATATCACATTATTAATAGTTATAATTAATAATTATG +AATCCATCACACTATAGGTTAAAAAATTTAGAAGTTCAACCACATCTGGCAGATTACAAG +CAAACTCTAAAGCATCATTGAAAAACAGGGGCTGGGAGCGGTGGCTCACGCCTGTAATCC +CAGCACTTTGGGAGGTCAAGGCAGGTGGATTGCCTGAGCTCAGGAGTTCTTGACTAGCCT +GGGCAACACAGTGAAACCCCATCTCTACTCAAATACAAAAAATTAGCCAGGCATGGCAGC +ATGTGCCTATAATCCCAGCTACTTGAGAGGCTGAGGCAGGAGAATTGCTTGAACCTGGGA +GGGAGAGCTTGCAGTGAGCCAAGATCACGTCACTGCACTCTAGCCTGGGCGACAGAGCTA +GACTCCGTCTCAAAAAAAAAAAAAAAAAAAAGAAAGAAAGAAAAAAAAACAAAATATTAC +TGAGGTACAATGTGTTGCTAAGATACAAACTCAAAAAACCCATGTCATCATATCAAGATG +ATCAATTTAAATCTGAGGCAGAAGTAATCTGAGCCCTTATTTTCCTAGGAAAATAGAAAG +AAGAGAAAATATAGAAATCTATAGAAAATATAGAAACCATGGGCCGGGCGCGGTGGCTCA +TGCCTGTAATCCCAGCACTTTGGGAGACAGAGGCGGGTGGATCACGAGGTCAGGAGTTCG +AGACCAGCCTGGCCAATGTGGTGAAACCCCGTATCTACTAAAAATACAAAAATTAGCCGG +GTGTGGTGATGCGTGCCTGTAGTCCTAGCTACTAGAGAGGCTGGGGCAGGAGAATGGCGT +GAACCTGGGAGGCGGTGCTTGCAGTGAGCAGAGATCATGCCACTGCACTCCAGCCTGGGG +GTGACAGAGCGAGACTCTGTCTCAAAAAAAAAAAAAAAAAAAAAAAAAGGAAATATAGAA +ACCATGTAATCAGTCTATACTGAAAGGTGACATAGAATGTTATAAAATGTTTAGTTTCTT +CAAATAGTTTTAGTTTTTACAATAATAAATATACTGGTAATATGTGTTTATATATTTATG +TATCTATACACACAACACATATAATGTATATATGCAGATACAAACACACTCACGTATATG +CAATTTAAAAAACTATACAGAGGCCAGGCGCGGTGGTTCACGCCTGTAATCCCAGCACTT +CGGGAGGCCAAGGCAGGCAGATCACGAGGTCAGGATTTCAAGACCATCCTGGCCACATGG +TGAAATTCCGTCTCTACTAAAGACACAAAAACTTAGCCGGGCGTGGTGGCGCGCGCCTGT +AATCCCAGCTACTTGGGAGGCTGAGGCAGGAGAATCGCTTGAACTCGGGAGGTGGAGGTT +GCAGTGAGCCAAAATCGCACCATTGCACTCCAGACTGGCCAACAGGGCGAGACTCCATCT +CAAAAAAAAACCCAAAAAACAACAACAAAAAAAACTGTACACAGATAGATGCGCTCCTTA +ACTTATGATAGGGTTATGTCCTGATAAACCCATAAGTTAAAAATATTGTATCTGCTGGGC +GCGGTGGCTCACACCTGTAATTCCAGCACTTTGGGAGGCCGAGGTGGGCGGATCACGAGG +TCAGGAGATCAAAACCATCCTGGCTAACAAGGTGAAACCCCGTCTCTACTAAAAATACAA +AAAAAAATTAACCAGGCGTGGTGGCAGGCACCTGTAGTCCCAGCTACTCGGGAGGCTGAG +GCAGGAGAATGGCGTGAACCTGGGAGGCGGAGCTTGCAGTGAGCCGAGACCACGCCACTG +CACTCCAGCCTGGGTGACAAACAAGACTCCGTCTCAGAAAAAAAAAAAGAAAGAAAAGAA +AATACTGTATGTCAAAAATGCCTTTGTGATAACCTAACCTACTGAATGTCCCATCTCAGC +CTTGCCTCAGAATACTTACATAGTCTATAGGCAAAATAACCTATTTTATAATAAAATGTT +GAATATCTTCTGTAATTTATTGAATACTATACCGAAAAACAATGGTTCAATAGGTACTTG +AAGTATGGTATCTACTGCAAAAAATAACTTCTGCAACAAGGTAAAGTAGTAGAAAAAAAT +ATATATATATTTTTTTGAAACACAGTCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGCA +TAATCTCGGCTTACTGCAAGCTCCATCTCCCAGGTTCAAGTGATCCTCCTGCCTCAGCCT +CCCATGTAGCTGGGATTACAGGCGTGGAACACCATGCCTGGTTATTTTTTGTATTTTAGT +AGAGACGGGGTTTTGTCATGTTGGCCAGGCTGGTCTCGAACTCCTGGCCTCAGGCAATCC +ACCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACTGCGCCCGGACAGA +AAAGTCTTCAGTTGAAACATCTGAAGCTGGGGGCCATCTGCGGTAGACTTCTGTAAATGC +ACAAAATAAGATAATGTTAAAGCCATGTTTCTCAAAGTCCCGAGCTCCACGTAAACTGCC +TATTATCAGAAAAAAGTTATCAATTAAAAGTCAAAGGCATAAAGAACAAACTAACACAAA +AAAATTTTAAATACCTTTGCTGGGTCACAAGGCCGCCGGTTGATAAAGAAAAACTGTCTG +TCTGTTGAACTCCTTCCAACTCCATGCGTGCATTGTGAAATGAAACCTGAGATGCTATTC +AACATTAATATGGTAAGGGCAGGATTCCAGAGTGAAAGGGATTAGAAATACGATCACATG +GCACATTCTTAAAGTGAAATGAAAACAAAACACCAGGTGACATGCTGATAAGGATCACTA +TTGCAGTTCACGGGTATCTGTGCTCCAAATCTTGATGAGTCATCAAAGAACCAAACCTTC +TGGAATATTCTAAAGCTCCTACAGTCAACCAATGCACCACAGGTGATGCAGTGCGTCCAA +AACTGATGTGTTGCAGCTCTCCTTACCCTTCCTGATAAATCCTCAGCCTCTGTAAGTGGG +TCTCGCTTCAAATGCATTCTCAGAACCTCCGTGCTGCCACCCCTGGTTTGTCAATGAAGT +CTAACCACTTGTGCTCAGAATTTTGCCCACATTCCCTCCCCTTTCAAAACCTCCCGGGTA +GGACGCTTATATCTCATGTCTTGGTAAAGCGCTTGCTTCACATGAGACCCACCCCAGGGA +TACCGGCATTTCCAGAAGAACACCACCTTCACATAAAGACATAAAGCTCCATGTTTACCA +TTTCAGGCATAAGCCAAAAGCAAGTGGAGGAAGAGTAAGAAATATAGATCTCAAGGCAAC +AAACAAACAAACAAAAAGAAATACAGATCTTAGGCTGGGTGTGGTGGCTCATGCCTGTAA +TTCCAGAGCCTTGAGAGGCCAAGGTGGGTGGATCACCTGAGGTCAGGAGTTCAAGACCAG +CCTGGGCAACATGGCGAAACCCCGTCTCCACTAAAAATACAAAAAATCAGCCGGGCATGG +TGGTGAACACCTGTAGTCCCAGCTTCTCGGAAGGCTGAGGCAGGAGTATCGCTTGAACCT +GGGAGGCAGAGGTTGCAGGGAGGCAGAGGTTGCAGTGAGCCAAGATCACGGCACTGCACT +GCAGCCTAGGCAACAAAGCAAGACTCCATCTCAAAGCTAAAAAAAAAAAAAATATATATA +TATATATATATATACACACAGATAGATAGATATCTTTACAGGACCAATCCTATTTATGGA +AGTGTCTATTTTCTTATACGAAAAGTAATGACACTGAACTGCCTTCATCAGATGCCAGGA +AAGTCAAAATCATTTAAAATGATAAAATAATTTACAAGTTAGTCTAACTAAACAGAGCCT +TAAAGAAGACCTGCTCAACAGAAAACCACCTGAAATATACCACTTACTCAAAACATGGTT +TGAATTAAGCAACTGACTCCTTTGTATAAATCATCTTTCTTAGCCACAGCATTGCTCACA +GTTTTATAAAGGACATAAAAAACTATTATCCCTAGCCAGGCGTGGTGGCTCATGCCTGTA +ATCCCAGCACTTTGGGACACCAAGGTGGGCGGATCATCTGAGGTCAGGAGTTCGAGACCA +GCCTGGCCAACATGGTGAAACCCCGTCTCTACTAAAAATACAAAATTAGCCGGGTGTGGT +GGCACGTGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATTGCTTGAACTCA +GGAGGTAGAGGTTGCAGTGAGCCAAGATAGCACCATTGCACTCCAGCCTGGGCAACAAAG +CAAGACTCCGTCTCAAGAAAAAAAAAAAAAGACACGAAACTATTAGCCTTAGAATCACTA +TCTTTAAAAAAAAAGCTCTCAGGATAAAATGTTCAATTGTAGTTCTCTTGCCAGCAATCT +ACTTACTAAAAAAGATTATGCAGAGCATCGGAACAGCTCAAACCGTACTCTTCACACACG +GAGTCACTAGGGGGCAGCTGAACAAAAGGAATGAGGCTTTGCAACTGAAAAAAAAAAAAA +AAAATTCACAGTTACTTCCTAATAAAGACAGAGTGGACTTAATCTGTTTTCTTTCTTAGT +CAAGCTATTGACATTACAAGCGCAAAAAAAATTAAAAGAATCTTTTGTTTTGTTTTGTTT +TTTGAGACAGGGTCTCCCTCTATTGCCCAGGCTGGAGTACAATGGCTCAATCATACCTCA +CTGCAATGTCAAACTCGTGGGTTCAAGCAATCCTCCTGCGTCAGCCTGTCGAGTGAGTAG +CTGGGACTACAGGTGCACACCACCACACCTGGCTAATTTTTTAATTTTTTTGTAGAGATG +GGATCTTGCCGTGTTATCCAAGCTGGTCTTAAATTCCTGGGCTCAAGCGATTCTCCCACC +TCAAAATTGTTGGCCGGGTGGTTCAAACACATAATCCCAACAGTTTCCTCTCCCAGAGTG +CTGGGATTACATGTGTGAGCCGTGGGAACAACAATTTTGATTTTATGATATAAGAAAGAT +GAAACAAGTACCTACTTATTCAGAACCCACACATTGCCCACAATAACTTATATTTTTTTC +AGAGAGAGAGTGAAAAGACGCAGTATACGAGTGTCTCTGGAAGAATAAAATGAAACACAT +TCAGCTCTCAAACATCAATTTTTGTGATAGGTACTTTGTTTTTTTTTTTTTTTTTTTCCT +GGGATGGTGTCTTGCTCTCTCGCCCAGGCTGCAGTGCAGTGGTGCAATCTCAGCTCACTG +CAACCTCCATCTCCCGGGTTCCAGCGACTCTCCTGCCTCAGCCTCCTGAGTAGCTGGGAT +TACAGGTGCCTGCCACCACGAACAGATAATTTTTGTATTTTTAGTAGAGATGGGGTTTCA +CCATATTGATCAGGCTGGTCTCAAACTCCTGACCTCGTGATCCGCCCACCTCAGCCTCCC +AAAGTGCTGGGATTACAGACGTGAGCCACTGCGCCGGGCCTTGTGATAGGCACTTTAAAA +ATCAATTCTTAATCTGGGCGCAGTGGCTCACGTCTGTAATCCCAGCACTTTGGGAGGCCG +AGGCAGGCGGATCACTAGAGGTCAGGAGTTCGAGGCCAGTCTGGCCAACAAGATGAAACC +CCATCTCTACTAAAAATACAAAAAATTAGCTGGGCCTGGTGGCATGTGCCTGTAATCCCA +GCTACTCAGGAGGCTAAGGTAGGAGAATTGCTTCAACGCGGGAGGCAGAGGTTGCAGTGA +GCCAAGATGGCGCCACTGCACTCCAACCTGGGCAACAGAGCAAGACTCCAGCTCAAAAAA +AAAAAAAACCGGCCGGGCTTGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGA +GGCTGGTGGATCACGAGGTCAGGAATTCGAGACCAGCCTGGCCAACACGGTGAAACCCCG +TCTCTACTAAAGATACAAAAAATTAGCCTGGCGTAGTGGAGCATGCTTGTAATCCCACTA +CTCGGGAGGCTGAGGCAGGAGAATTGCTTGAATCTGGGAGGCGGAGGTTGCAGTGAGCCA +AGACAACACCACTGCACTCCAGCCTGGGCAGCAGTGCGAGACTCCCTCTCAAAAAAAAAA +AAAAAATCAATTCTAAGATTTTATTCTCCATTCTACTGGAAGGGACAATGGAAACCCGCT +ATAATCACTAGAGCAATAAGAGGCGTTGAAGTAACCGGCCATCACTACCTGCTTCTGCCC +AAACACAGAGCCGATATTTTCCTTTATGCTGGGGCTTCCACCTGTGCATACCACAGGCTG +TCGTTTTCCTTGTCCAAGCTGATTGGTGCAACTTACACGGATGCCTGCTGAAATGATACA +GTATGCATGTAAGACCTGGACCATTTTGGCATACTCCTGTTTAAAAAACACAAACACAAT +ATTCTACATTACTTTAATATTATAGGAATTACACAGCTCAAGTTACAACATCCAACGCAA +GGTTCTCACATCATCGCACAAATCAAGGGAAGCACTGTTGACAGAATGATCTGTAAAGAG +GTGTCTTCCTATATTCTACAGAAAGGAACGCAGAGCTTTTGGCTCCTGGTCACAGTCCTC +TCACTTCCCAATGTGCCATGCATCCTGGTAAAACAACTAAAAAGTACAGCCTGTAATCCC +AGCTACTCAGGAGGCTGAGGGCAGGAGGATCACTTGAGACCAGGAGTTCAAGACCAGCCT +GGGCAACACAGCAAGACCCTGTCTCTACAAAAAATTTAAAAAAAAAATTAGCCGGGCGTC +ATGGCATGTGCCTGTAGTCACAGCTACTGAGGAGGCTGAGGTGGGAGGATCGCTTGAGCC +TAGGAGTTCAAGGCTGCAGTGAGCCATGATTGCACCACTGCACTCCAGCCTCGGTGACAG +AGTGAGGCCCTATCTCTAAAAATGAAAATTAAAAAACTGAAACGTACATTGTGTTTGATT +TTATAATCTCTCCTTTTGAAATGTATCTTCGTATAATAGAAACACTGGCACAAGCATTTT +GGTATGCAAAGAGATACACAAAAATGTTCACTGAAACAATCTCTATGAACAAACAGAAAC +AACCTAAGCAAGCATCATTGAGGAGTTGATTAATTATGGTATAGCCATAGCGCAGCAGAA +TGACAACAAATAAGGCAGTGTGCACCGACTAAAAAAGACAATCACAATATGCTAAGTAAA +AAGTCAGTTATAGGGCCAGGCATGATGGTTCACACCTGTAATCCCAGCACTTTGGGAGGC +TGAGGCGGGAGGATCACTTGAGCCCACGAGTTCGAGACCTGCCTGGGCAACACAGAAGGA +CCCATCTCTACAAAAAAAACAAAAATTAGCCGGGCATGGTAGCACGGGCCTGGAGTCCCA +GCTACTTGGGAGGCTGAAGTGGGAAGATTCATTGAGCCTGGGAGATCATGGCTGCGGTAA +GCTGAGATTGTGCCACTACATCCCAGCCTAGGTGAGAGAGCAAGACCCTGTCTCAATTAA +AAAAAAAAAAAAAAAAAAAATACAACTTTCAACCACATACAATTCTGTATTACTTGCATG +TTGTACATTCTATATTACTTGCTTTCATTATATTAACTTATGAATTTATCTTGAAAATTA +TTCCAACAGTTATAAACACATGAAATTAAAAGCAGCCTGAAAAGATATACAAACTGTAAA +TAACAGTTATCTCTGACAAATAGAAGTTCTACATTCCTGTATTCTGCTAAGGCACTAATT +TTTTTACCATAAGATACAAAAAAAGAGTAAGTTTTCTCTACTTTAGAAAATTTAAATTTG +TGAAAAAATGTAATAAAGTTAAAATTAGCAGCCAAGTGCAGTGGCTCACACCTGTAATCC +CAGCACTTTGGGAGGCTGAGGCAGGTGGATCACTTGAGGTCAGGGGTGCAAGACCAGGCT +AGCCAACATGGTGAAACTCCATCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGC +GCACACCTATAATCCCAGCTACTCGAGAGGCTGAGGCAGGAGAATCACTTGAACCCAGGA +GGTGGAGGTTGCAGTGAGCCGAGATCGCACCACTGCACTCCAGCCTGGGCGACAGAGTGA +GAAGACTCCATCTAAAAAAAAAGAAAGTTAAAATTAGCACCAAATGCTTTACAAGTAAAA +AAAGTTTTTAGCTGCATATGTTTAAGTAACTTTTTAGATTATGAAAAACACACATACAAA +ATGGGAAGGCACAAAGAAGACAGCAAAAACTGCATGAGATCTCACATCCAAGGATAACTG +CTGAGAACATGAAAGTGCCGAGTCTTCCAGCCTTTATACTATACACATTTAGGCTTGTTG +TTTTGTTTTCACAAAATTGTAATCAAATAATACAGACAGTTCTATAATCTGCTTTTTAAA +CACAACGACTATATAACATTTAGCTATTTTCATTTGCATTCAAATTCATAAGGGTTCTAA +TAGCTCATTTCTCAGAAAACCAAGAGAAATATTCTTTTTTTTTTTTTTTTGAGATGGGGT +CTGGCTCTGTGCCCAGGCTGGAGTGCAATAGCTTGATCTCGGCTCACCGCAACCTCTGCC +TCCCGGATTCCAGCGATTCTCCTGCCTCAGCCTCCCAAGGAGCTGGGACTACAGGCACAT +GCCACCATGCCCAGCTAATTTTTGTATTTTTAGTAGAGATGGGGTTTCACCAGTTTGGCC +AGGATGGCTTTGATCTCTTGACCTCGTGATCCACCCGCCTCAGCCTCCCAAAGTGCTGGG +ATTACAGGTGTGAGCCACTGTGCCTGGCCGAGAAATATTCTTATTAAAATATAAGTACAT +AAGGCCAGGCATGGTGGCTCAGGCCTGTAATCCCAGCACTTTGAGAGGCCAAGGTGGGCA +GATCACCTGAGGTCAGGAATTCGAGACCAGCCTGGCCAGCCTGGACAACATGGTGAAACC +CCGTCTCTACTAAAAATACAAAAATTAGCCAGCTGTGGTGGTACACGCCTGTAATTGCAG +CTACTCAGAAGGCTGAGGCAGGAGAATCGCTTGAACTCAGGAGGTGGAGGTTGCAGTGAA +CCAAGATCGCGCCACCGCACTCCAGCCAGGGCGCCAAAGAGAAACTCCATCTCAAAAAAA +GATAAAAATAAAAAATAAAAAATATATATATATGTATATATATTTTTCCAGACAGGATCT +TATTCTGTCTCCCAGTCTTAAGTGCAGTGGCGCAATCATAGCTCACTGCAGCCTCAAGTT +CCTGGGCTCAAGTGATCCTCCCACTTCAGCCTCCCAAGTAGCTGGAACTACAGGTACATG +TCACCATGCCCAGTAAATTTTTTTTTAAAATTTTTCATAGAGACAGGGTCTCACTGTGTT +GCCCAGTCCTAATAAACACTATGTGATGAAAAGAAAAAAGTAAATCATCCTAAAGTTAAG +TCTTTAATGTTAAATCTTTAATGAGAAATGCAAATAAAGCATTTCTCAATAATTTATGGG +AAGAGAATCAACTGAAGAATAAACATCTTTAGTAAATCTTTTGCTCATGTGCATTAACCA +ATACTCTTGAAAACCAGGATTAATTTACTGTACCTTCTTAATATTCCTTTGAAATTCCTT +ATGGCGCACAGGTAGTGTGGAAAATAACTGCTGCACGCTGACTGTGGTCCCTCTGGGGCG +GGGGTAGGGGGTTTTCTGGATAATTTTCCCATTGTGATCAAACATCAGTCGAGTTCCAAC +CTTCGCCGATGCGTGGCAGGTAGAAATGGTGACATCGCTGTGAGAGAATACCAGGCATGG +TGTGTTCAGTGAGAGACCCATGATGTTGGGCACTGACTACTCTTTTCTTCACTTGCTTTT +CTCTCAAAATTTTCTTAAAAAGCTGACGATCCCTCTGAGATAATCAAGATCTAAATGGTT +GAGGAGTCATCATAAAATCTAAGGTTTGGCATCTAAAAGACAGTGAGACAGAGAGCACTA +AACATGCTTTGCTTTGATAAAAGCTTTGATTTCGTTTTTCAGGTTGAACTGCAAAACCAT +AAATGATCTTAAGATTTATTTATTCACAAACACAGATTTGTTTTGTTATTACTCTTCGAA +CAAATTTTTTTTAAAGAATCTAACAAATATTATAATTAAAATGTATATGTAGGGCAGAGC +GTGGTGGCTCATGCCTGTTATCCCAGCACTTTGGGAGGCCAAGGCAGGCAGATCACTTGA +GGCCAGGAGTTTGAGACCAGCCTAGGCAACATGGTGAAATCCCATCTCTACTAAAAATAC +AAAAATTAGCCAGGAGTGGTGGTGCATGCCTATAGTACCAGCTCCTCAGGAGGCTCAGGC +ACGAGAATCACTTGAACCTGGAAGGCAGAGATTGCAGTGAGCCGAGACTGTGCCACTGCA +CTCCAGCCTGGGTGACAAAGAGAGACTCTGTCTAAAAAAAAAAAAAGATATATATATATA +TATATAATTATTTATAAAAATTTCATATCTGTGCTATAATTAAATAGTGCTTTGGTGAAA +TGTTTCCCTAAAAATTGATAATGAAAACCAATGGTAACTATCATTTATTATCTACATGTT +AGGTTAAAATTGAGAATTACTGTTTTAATAAGGGTAACCATCTTTTTAACAATACTATTT +GCTTCATTTCATTCATTTATTGCTCACATTTCAGAAGTACTATGACTTAGATTGGCAGCG +AGACAAAACAGAATTCAGAAGCTAGAAGTTGAGATGTTGAGATAGAAAACTGAAAATAAT +AATGATTCCAATTAATTTTCAGAGAGGTTTCTCTAAGGGGTCAAGTGAGTGGATAAAAAT +ATTGTATCACCTCAGTGCACAAAGTGAGCTCAGAGCTTCCCCCCGAAAGCCAAAAGTTTC +AACCTGAGTTAGGTCGGCAAACTCTTGAATCTTAGATGTGTGATGTTTCAGAGCTGAAAG +AGAGTGTAAAGTAAGGACTAAGATATCTCAAGTGCTATAACAACAAAATATACATGATAT +CTAGTAACTGGCTTTAAAAAACTGTTTTTGCATTTCCCAAGACAGTGTTACTCAAAATTC +TGAGACATGTGACCCAATTATTTTATAATAGGATTAGAAAAAGTCAACTTACTTAAGCCT +TCGAAGTTTTCTTCTTCTACCCCACATCCATTGTCTGAAACTTCAATAAGATCCACTCCA +TAGTCCTTAAGCTTTAGATCTAGAAAGTTTAAAATATTTACATATTTATTAAAAACGGAC +CCATGCTATCAGTTTTTATATTGACATTATTTATAACATATGCAAATTTAAGAGTCATAA +CTATACCTTTAGTTAAACATACTAGTGTCATTTTGTATATTTCATTGTTATAAAGTCCTT +TCTGGCTATTTACTAGCCCAGACTAAATAGTTTAGCTTTTTCTTTCTTTCCTCTTTTTTT +TTCCCTAGGCTAGTGAAGTGAAGCAGTTGGAGTGGAGAAGGAACAAAAAAAATCTGTAAC +TGGTGGTGATCAATTAGCTGTAAACCGCGTTGCACTTTGACCATCCTTTTCTTTTGAAAG +AAATAATTTTAACATACCCAATAAAGAGAACGGGGACCGGGTGCAGTGGTTCATGCCTGT +AATTCCAGCACTTTGGGAGGCCAAAGCGAGCAGATCACCTGAGGTCAGGAGTTCGAGACC +AGCCTGACCAACATGGAGAAACCCTGTCTCTACTAAAAATACAAAATTAGCCAGGCTTGG +TGGCGCATGCCTGTCATCCCAGCTACTCAGGAAGCTGAGGCAGGAGAATCACTTGAACCC +AGGAGGTGGAGGTTGCAGTGAGCCGAGATCGTGCCATTGCACTATAGCCTGGGCAACAAG +AGCAAAACTCTATCTCAAAAAAAAAAAAAAAAAGAGAATGGGTTCTGGAATCAGACTTCC +TGGATCCTATTTTATCAGCTTTATAATCTCAAAAAAAGGAAATTTCCTATCCCCTAATTT +CCTCATTTGTAAAATAGAGAATAATAAGTTCTATCTCATAAAGTTATTCTGCAGATTAAT +AATTCTTTGGTTTTTTTTATTTTATTATTCTTTTCTTTTCTTTTGAGATGGAGTTTTGCT +CGTCACCCAGGCTGGAGTGCAGTGGTACGATCTTGGCTCACTGCAGCCTCCACCTCCCAG +GTTCAAGCAATTCTCCTCCTTCAGCGTCCTGAGGAGCTGAGATTACAGCCATGCACCACC +ACATCTGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCATCATGTTGGTTAGGCTG +GTCTAGAACTCCTGACCTCAAATGATCAGCCCCCCTCAGCCTCCCAAAGTGCTGGTATTA +CAGATGTGAGCCACTACTCCAGCCCTATTTTGTTTTATGTTTTTGAGATGGAATCTTGCT +CTGTCCCCAGGCTGGCATGCAGTGGCACGATCTCGGCTTACTGCAACCTCCGTCTCTCGG +CTTCAAGCAATTCTCGTGCCTCAGTGTCCCAAGTAGCTGGGATTACAGGCTTCTGCCACC +AGGTCCAGCTAATTTTTGTATTTTTAGTAGAGACAGAGTTTCACCACTTTGGACAGGCTG +GTCTCGAACTCCTGACCTCAGGTATCCACCCGCCTTGGCCTCCCAAAGTGCTGGGATTAC +AGGCGTGAGCCACTATGCCTGGCCTACTTTATTTTTCAATAGAGACAAGGTCTCACCATG +TTGGCCAGGTTGGTCTTGAACTCTTGGCCTCAAGCAATTCCCCCACCTCGGCCTCTCAAA +GGGCTAGGATTATAGGCGTGAGACACCACGCCCAGCTGTTCTGCAAATTAAATATTTCTG +TGCAATTCTTAGCATAACACCTGCCTGGCACACCGTAAGAACACAATAAAAGCTGTTATT +ATTATTACTACCTAGCTAAGTACTAGGCACATAATAGGTGCTAACTTCAACTTAAAAATA +ATAATTTATTACTACATCAACACTTGATAGTCTTATTTCAATAACAAATGTTTCTTAACT +ACAACAACATTCACAGATCATTTCTTGTGGCTTAAAACTCTCCCAAACTTACCAATATTA +GTGGCACCAGCATCCAGACTGTTTTCTACTAACTCCTTTACCGCAGTGCTTAGACTCAGT +ACCACCTGCCCAGAGCAAATCTGATGGACTGACTTCCGATCAATAGGTTTGATGGCCTTA +GCAGGTTCTGTACTAGAGAAATCAGTTACAAGAAACAAATCAAGTATTCAGCTATATATT +TTCATCCTGATTTTAACTGTGGGAAATGACTCAACACTGTAAATAATTTATGGGTCTAAT +CTATTCATTTATTATATTAGCAAATACATTTATTATATCCAGAAATAGAAACACTGTTTT +ACAATCCTTAAACATGTACCCAAAATACTTCTGGATAGATACTTCAAATTCAACAGATCC +TTACTATCTAATTATACTAAGATCCACATGGAGAAAACATACATTGTATCTCTCAAATTA +CCAAAATCTTTGGCAACAATGGTGTCTTCTTTCTTGAAAAGTGAAAGCATGGCTGGCTGT +GGTGGCTCATGCCTGTAATCCCAGCACTTTGGGAAGCAGAGATGGGTGGATAACTTGAGG +TCAGGAGTTCGACACCAGCCTGGCCAACACGGTGAAACCCCGTCTTTACTAAAAATACAA +AAAATTAGCCAGGCATGGTGGTGGGCACCTGTAATCCTAGCTACTCAGGAGGCTGAGGCA +GGAGAATCGCTTAAATCCAGGAGGCGGAGGTTGCAGTGAGCTGAGATTGCGGCATTGCAC +TCCAGCCTGGGCAACGAGCAAAAAAAAAAATGAAAGTAACATAATTTCCCAACATAATTA +GAAAAACCAACAGTATGCTGGGAAATACACAATGTTTAAGTCAAAATCATCTCAGAAATT +GGGTACCAGTTATATAACTATTCCTTATACACAGTTGCCTTTGATACCCCACTCCAAACT +GAAGCTGCCAGCTGCTGTCTTAGCAAAGACCCTCAAAGCTCTTGCTGTACTAGCTTTAAG +AGTTTTATAAAGGTTTTATCTCCCCTTATTCCCTGCTCCAATACATCCTCCACTCTATCA +CCAGAGCTATTTTTGAAATCACAAATCTGGTCAAATAATTTTTCTGCTTAAAAATTTACT +AGTGCCCCACTTCCTACTATATGAAAGTTAAAATTTAGTCATCATTGGGGCCAAAACTAC +CTTCTTTTCAGAATCTCTCTAATCCTTTCCCTTCATCAAGTCCCCTACATTATTATTATT +ATTATTATTATTATTGTTATTATTGTTATTATTTGAGACAGAGTCTCACCCCGTTGCCTA +TGCTAGAGGGCAATGGCATGAGCTCAGCTCACTGCAACCTCCGCCTCCCAGGTTCAAGCG +ATTCTCCTATCTCAGCCTCCCAAGTAGCTGGGATTACAGGCGCCCACCATCACACCCAGC +TAATTTTTGTGTTTTTAGAAGAGATAGGGTTTCACCATGTTGGCCAGGCTGGTCTCGAAC +TCCTGACCTCAGGTGATCCGCCTGCCTCGGCCTCCCAAAGTGCTAGGATTACAGGGGACC +GCAACCAGCCATCCCCTATATTGTAGCACAGTGAACAACTGTCCTGAACATCACAAGCTC +TTTGAGACACTACAGTGTATAAGCAGGTCTCTGTCTAAACCGCTCTCCTCTTCCTCCTCT +GCCCAAACAATGTCTGCTCAAAGAATGTATCCCGTGTGTTCATTAACTTAGCAATTTCCA +GCAAACAGTTTAATTGATAACTTGTTAAGAGAAGGCAGGAAACCTCCATGAAAGAGAAAT +CACTGGGTATTTCCTACAGCATTTAACACATCGTAGGCCTTTAATAAACCCTTCTGAAAT +AAACAAACCTCTTTACTCTTCATTCCACCTTGCTAAGAATCTCACCTAAGTCTGTCTACC +ATGTGAAACTGCAGATGACCTCACAGAAAATGGAAAGAAGTATCTCTAAAAATAAGTTTA +TTTGGCAGCACACTATAGGCTACAGGTCCACTTCTGATTTTTTTTTTTTTTTTTTTTTGA +GACCGAGTCTTGCTGCGTTGCCCAGGCCGGACTGCAGTGGCACGATCTCAGCTCACTGCA +ACCTCCGCCTCCTGGGTTCCAGCGATTCTCCTGCCTCAGCCTCCAAAGTAGCTAGGATTA +CAGGCTCCCGCCATCATGCCCAGTTAATTTTTGTATTTTTAGTAGAAACGGATTTCACCA +TGTTGGCCAGGCTGGTCATGAACTCCTGACTTCATGATCCACCCGCCTTGGCCTCCCAAA +GTGCTGGGATTATAGGCGTGAGTCACCGCTCTCGGCCCACTTCAGATATTTATTTTGAGG +AGGGAGCGCATTTAGACACAGACCCCAAATTTATTTAAATGTCTCAATACATTTAAATGT +AGTTACCTAAATATATCTAATATATTTAAATGCAGAGAGCAAATTTGCGTTTACAAATCT +GACATGGAATGCAAATGTGCTAGCCAAGATTCGGTGTAGCTTACCAGCCAGAAATCACAC +ATCCTAACAGGTAGAAACGTATTGCATTTTTAAAAACTGCGCAGCTATGCAAATAAGGAT +GTGTCTGGACGCTCTACCGTCCCCAAAATAACCTTAATTTTTTAAAAAGGCCAGGCACGG +TGCATCATGCCTTTAATTCCAGCACTTTGAGGGGCCAAGGCGGGCGGATTGCTTGAGCTC +AGGCGTTCGAGACCAGCCTGGGCAACGCAGCGAAATCCCCGTCTCTACAAAAAAAAATTA +AAAATAAAATACTATAAAAATAAAAATAAAAGGGGAGAGAGAACAGGTAGAAAGGAAATG +CATTCAGTCTATGGGGATTTCACGCTCCCGCTTCAAGTCCACGGCCCTGTGATGGGATGT +GGGCAAGGCCTGTCTGGGACAGGCCGAACCCAACTCCTCACAGGGCCGAATCCTTTGCCC +GCAGCCCAGGACCCCGAAGGAGCTTGCCTCGGCCTCAAGGCGCACCCAAGGGGCACGAGA +TCGCTGCAACACTGAGGTCGCCACTCCGGGGCCTCCAGGGGGCTGCCTCGCCACGCGCCT +CGGCCATGTTCCCCCCATTTCCAGGGAGGTTGGAATGCCGTGGGTCTCAAAGAGGGCGCG +CGAGAGGGGACACCGGAAGACTGCGAGCCCCGCTCACCTCGAGCTCTCAGCTCGCTCCAT +GGATGCAACACCCGATCCGCCTCGGGGACTGGGAAAGTTCCCTCCAGGGCTCCCACAGGC +GCTCCGCCTCCTGAACTCCCATTGGCTGCTTTCGACGTTGTGCTCCACCCTTTCCGGGCG +GGGCGGCAAAAATACTTCCCGTCTCTCCTTTTCGCCTATTGGCTCTGTCAAAGGTCGACT +TCGTGACGTCAAAGAGCCTGGGCCAATCAGAGCACACCGGACTGCGTTTTCCCGAACGCC +CGCAGCAGGGTCAGAAGGGAGGTGGCCGGTCTCCGTCGTGACCTCTGACGGTTTCTGAGC +GTTGGCCTTTGGCACGCGCTACCCCCTTTTGCTTTGGTTCTGCCATGCCGATGTACCAGG +TAAAGCCCTATCACGGGGGCGGCGCGCCTCTCCGTGTGGAGCTTCCCACCTGCATGTACC +GGCTCCCCAACGTGCACGGCAGGAGCTACGGCCCAGCGCCGGGCGCTGGCCACGTGCAGG +TAGGAGCGCGGGGCCCCCCGCCCAGTGCGCACGCGCGGCGACCGGCTGCTGGCCCGGGTC +CCCCCAGGCCGGAGCGAGCGCGTCCCAACCGGTTCACGGCCCCACCCCGGCATCTGTGCC +GGCCGGCCAGGGACTCACTCAGACTTTTATGTTTTAAAAGATTTATCCAGGCCGGGCGCC +GTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACCTGAGGT +CAGGAGTTCGAGACTAGCCTGGCCAACATGGTAAAACCTCGTCTCTACTAAAAATACAGA +AATTGGCCGGGTGTGGTGAGGCGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCAGGAG +AATCGTTTGAACCCTGGAGGCGGAGTTTGCAGTGAGCTGAGATCGAGCCATTGCACTCGA +GCCTGGGCAACAAGAGCTAAACTCTATCTCAAAAAAAAAAAAAAAAAAAAAAAAAATATA +TATATATATATATGTATGTAT diff --git a/paraphase/data/pms2/pms2_ref.fa.fai b/paraphase/data/pms2/pms2_ref.fa.fai index c9a4c62..aac690d 100644 --- a/paraphase/data/pms2/pms2_ref.fa.fai +++ b/paraphase/data/pms2/pms2_ref.fa.fai @@ -1 +1 @@ -chr7_5967000_5992500 25501 22 60 61 +chr7_5957000_6010000 53001 22 60 61 diff --git a/paraphase/data/rccx/rccx_config.yaml b/paraphase/data/rccx/rccx_config.yaml index 3123981..4884727 100755 --- a/paraphase/data/rccx/rccx_config.yaml +++ b/paraphase/data/rccx/rccx_config.yaml @@ -22,8 +22,6 @@ coordinates: deletion1_size: 6367 deletion2_size: 120 - noisy_region: [[32029159, 32029159], [32022483, 32022483]] - left_boundary: 32013300 right_boundary: 32046000 diff --git a/paraphase/data/strc/strc_config.yaml b/paraphase/data/strc/strc_config.yaml index c6ae844..861fbd6 100755 --- a/paraphase/data/strc/strc_config.yaml +++ b/paraphase/data/strc/strc_config.yaml @@ -19,6 +19,8 @@ coordinates: depth_region: [[43610000, 43660000]] + pivot_site: 43602487 + left_boundary: 43599500 right_boundary: 43619600 diff --git a/paraphase/genes/cfc1_phaser.py b/paraphase/genes/cfc1_phaser.py index 0e05349..d7415e8 100644 --- a/paraphase/genes/cfc1_phaser.py +++ b/paraphase/genes/cfc1_phaser.py @@ -24,13 +24,10 @@ def call(self): return None self.get_homopolymer() self.get_candidate_pos() - # add pivot site - if "130593061_A_G" not in self.candidate_pos: - self.candidate_pos.add("130593061_A_G") self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites) + raw_read_haps = self.get_haplotypes_from_reads(add_sites=["130593061_A_G"]) ( ass_haps, diff --git a/paraphase/genes/f8_phaser.py b/paraphase/genes/f8_phaser.py index 608a7fe..b36caab 100644 --- a/paraphase/genes/f8_phaser.py +++ b/paraphase/genes/f8_phaser.py @@ -96,7 +96,9 @@ def call(self): self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites, check_clip=True) + raw_read_haps = self.get_haplotypes_from_reads( + check_clip=True, kept_sites=["155386300_A_C", "155386860_C_G"] + ) ( ass_haps, diff --git a/paraphase/genes/ikbkg_phaser.py b/paraphase/genes/ikbkg_phaser.py index 59ab7b6..66d1476 100644 --- a/paraphase/genes/ikbkg_phaser.py +++ b/paraphase/genes/ikbkg_phaser.py @@ -46,6 +46,7 @@ def call(self): self.get_candidate_pos(min_vaf=0.095) + # add these sites for duplication/deletion calling var_found = False for var in self.candidate_pos: pos = int(var.split("_")[0]) @@ -68,9 +69,10 @@ def call(self): self.remove_noisy_sites() raw_read_haps = self.get_haplotypes_from_reads( - self.het_sites, check_clip=True, partial_deletion_reads=self.del1_reads_partial, + kept_sites=["154569800_T_G"], + add_sites=["154555882_C_G"], ) het_sites = self.het_sites if self.del1_reads_partial != set(): @@ -101,25 +103,26 @@ def call(self): pseudo_counter = 0 dup_counter = 0 deletion_haplotypes = [] - for i, hap in enumerate(ass_haps): - nsite = min(len(hap), 10) - start_seq = hap[:nsite] - if start_seq.startswith("0") is False: - if start_seq.count("1") >= start_seq.count("2"): - gene_counter += 1 - hap_name = f"ikbkg_hap{gene_counter}" - tmp.setdefault(hap, hap_name) - if "3" in hap: - deletion_haplotypes.append(hap_name) + pivot_index, index_found = self.get_pivot_site_index() + if index_found is True: + for i, hap in enumerate(ass_haps): + start_seq = hap[: pivot_index + 1] + if start_seq.startswith("0") is False: + if start_seq.count("1") >= start_seq.count("2"): + gene_counter += 1 + hap_name = f"ikbkg_hap{gene_counter}" + tmp.setdefault(hap, hap_name) + if "3" in hap: + deletion_haplotypes.append(hap_name) + else: + pseudo_counter += 1 + hap_name = f"pseudo_hap{pseudo_counter}" + tmp.setdefault(hap, hap_name) + if "3" in hap: + deletion_haplotypes.append(hap_name) else: - pseudo_counter += 1 - hap_name = f"pseudo_hap{pseudo_counter}" - tmp.setdefault(hap, hap_name) - if "3" in hap: - deletion_haplotypes.append(hap_name) - else: - dup_counter += 1 - tmp.setdefault(hap, f"dup_hap{dup_counter}") + dup_counter += 1 + tmp.setdefault(hap, f"dup_hap{dup_counter}") ass_haps = tmp haplotypes = None @@ -161,6 +164,14 @@ def call(self): new_allele.append(ass_haps[hap]) new_alleles.append(new_allele) + if gene_counter == 0 or pseudo_counter == 0: + total_cn = None + gene_counter = None + # homozygous case + if total_cn == 0: + total_cn = None + gene_counter = None + self.close_handle() return self.GeneCall( diff --git a/paraphase/genes/ncf1_phaser.py b/paraphase/genes/ncf1_phaser.py index f28fe9f..79f57ec 100644 --- a/paraphase/genes/ncf1_phaser.py +++ b/paraphase/genes/ncf1_phaser.py @@ -27,7 +27,7 @@ def call(self): return None pivot_site = self.pivot_site for pileupcolumn in self._bamh.pileup( - self.nchr, pivot_site - 1, pivot_site, truncate=True + self.nchr, pivot_site, pivot_site + 1, truncate=True ): bases = [ a.upper() for a in pileupcolumn.get_query_sequences(add_indels=True) @@ -37,13 +37,10 @@ def call(self): self.get_homopolymer() self.get_candidate_pos() - # add pivot site - if "74777266_G_A" not in self.candidate_pos: - self.candidate_pos.add("74777266_G_A") self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites) + raw_read_haps = self.get_haplotypes_from_reads(add_sites=["74777265_A_T"]) ( ass_haps, @@ -115,6 +112,10 @@ def call(self): counter_gene = None total_cn = None + # homozygous case + if total_cn == 0: + total_cn = None + self.close_handle() return self.GeneCall( diff --git a/paraphase/genes/neb_phaser.py b/paraphase/genes/neb_phaser.py index b8b50e1..7152cf1 100644 --- a/paraphase/genes/neb_phaser.py +++ b/paraphase/genes/neb_phaser.py @@ -31,7 +31,7 @@ def call(self): self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites) + raw_read_haps = self.get_haplotypes_from_reads() ( ass_haps, @@ -127,6 +127,10 @@ def call(self): total_cn = None new_alleles = [] + # homozygous case + if total_cn == 0: + total_cn = None + self.close_handle() return self.GeneCall( diff --git a/paraphase/genes/pms2_phaser.py b/paraphase/genes/pms2_phaser.py index 2330195..90003bf 100755 --- a/paraphase/genes/pms2_phaser.py +++ b/paraphase/genes/pms2_phaser.py @@ -27,9 +27,9 @@ def call(self): self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() # for distinguishing pms2 from pms2cl - self.het_sites.append("5989137_G_A") - - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites, check_clip=True) + raw_read_haps = self.get_haplotypes_from_reads( + check_clip=True, add_sites=["5989137_G_A"] + ) ( ass_haps, @@ -77,6 +77,11 @@ def call(self): # bigger cnvs are not handled here yet if pms2_cn != 2: pms2_cn = None + + # homozygous case + if total_cn == 0: + total_cn = None + self.close_handle() return self.GeneCall( diff --git a/paraphase/genes/rccx_phaser.py b/paraphase/genes/rccx_phaser.py index 4b99b19..6180143 100644 --- a/paraphase/genes/rccx_phaser.py +++ b/paraphase/genes/rccx_phaser.py @@ -243,7 +243,7 @@ def annotate_var(self, allele_var): elif abs(len(tmp[1]) - len(tmp[2])) <= 1 and len(tmp[2]) >= 6: annotated_allele = "pseudogene_duplication" else: - annotated_allele = "duplicaton_WT_plus_" + ",".join(tmp[1]) + annotated_allele = "duplication_WT_plus_" + ",".join(tmp[1]) else: if abs(len(tmp[1]) - len(tmp[2])) <= 1 and len(tmp[2]) >= 6: annotated_allele = ",".join(tmp[0]) + "_pseudogene_duplication" @@ -367,7 +367,7 @@ def update_alleles( successful_phasing = True # add missing links when there is no two-cp haplotypes - if two_cp_haplotypes == []: + if two_cp_haplotypes == [] and len(ending_copies) <= 2: # add the missing link in cn=4 if ( len(final_haps) in [3, 4] @@ -509,11 +509,14 @@ def call(self): self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - het_sites = self.het_sites raw_read_haps = self.get_haplotypes_from_reads( - het_sites, check_clip=True, partial_deletion_reads=self.del1_reads_partial + check_clip=True, + partial_deletion_reads=self.del1_reads_partial, + kept_sites=["32046300_G_A", "32013265_A_T"], ) + + het_sites = self.het_sites if self.del2_reads_partial != set(): raw_read_haps, het_sites = self.update_reads_for_deletions( raw_read_haps, @@ -614,7 +617,7 @@ def call(self): if ass_haps == [] and self.het_sites == []: # homozygous, feed all reads to call variants total_cn = 2 - if total_cn < 2: + if total_cn < 2 or len(ending_copies) > 2: total_cn = None annotated_alleles = self.annotate_alleles( diff --git a/paraphase/genes/smn1_phaser.py b/paraphase/genes/smn1_phaser.py index 4b0608e..eef1abd 100755 --- a/paraphase/genes/smn1_phaser.py +++ b/paraphase/genes/smn1_phaser.py @@ -511,14 +511,12 @@ def call(self): [self.del1_5p_pos1, self.del1_5p_pos2], ] self.get_candidate_pos(regions_to_check=regions_to_check) - # always add splice site - if self.candidate_pos != set(): - self.candidate_pos.add("70951946_C_T") - het_sites = sorted(list(self.candidate_pos)) - raw_read_haps = self.get_haplotypes_from_reads(het_sites) + self.het_sites = sorted(list(self.candidate_pos)) + raw_read_haps = self.get_haplotypes_from_reads(add_sites=["70951946_C_T"]) # update reads for those overlapping known deletions + het_sites = self.het_sites if self.smn2_del_reads_partial != set(): raw_read_haps, het_sites = self.update_reads_for_deletions( raw_read_haps, diff --git a/paraphase/genes/strc_phaser.py b/paraphase/genes/strc_phaser.py index 1224ab8..5fbd083 100644 --- a/paraphase/genes/strc_phaser.py +++ b/paraphase/genes/strc_phaser.py @@ -29,7 +29,6 @@ def set_parameter(self, config): self.del1_3p_pos2 = config["coordinates"]["hg38"]["del1_3p_pos2"] self.del1_5p_pos1 = config["coordinates"]["hg38"]["del1_5p_pos1"] self.del1_5p_pos2 = config["coordinates"]["hg38"]["del1_5p_pos2"] - self.intergenic = config["coordinates"]["hg38"]["depth_region"] self.depth_region = config["coordinates"]["hg38"]["depth_region"] def call(self): @@ -50,7 +49,7 @@ def call(self): self.het_sites = sorted(list(self.candidate_pos)) self.remove_noisy_sites() - raw_read_haps = self.get_haplotypes_from_reads(self.het_sites) + raw_read_haps = self.get_haplotypes_from_reads(add_sites=["43602487_C_G"]) het_sites = self.het_sites if self.del1_reads_partial != set(): raw_read_haps, het_sites = self.update_reads_for_deletions( @@ -73,6 +72,9 @@ def call(self): read_counts, ) = self.phase_haps(raw_read_haps) + haplotypes = None + dvar = None + two_cp_haps = [] tmp = {} counter_gene = 0 counter_pseudo = 0 @@ -85,8 +87,6 @@ def call(self): tmp.setdefault(hap, f"strc_hap{counter_gene}") ass_haps = tmp - haplotypes = None - dvar = None if self.het_sites != []: haplotypes, dvar = self.output_variants_in_haplotypes( ass_haps, @@ -94,28 +94,46 @@ def call(self): nonuniquely_supporting_reads, ) - two_cp_haps = [] - if intergenic_depth > 5 and len(ass_haps) == 2: - two_cp_haps = list(ass_haps.values()) - elif counter_gene == 1 or counter_pseudo == 1: - two_cp_haps = self.compare_depth(haplotypes) - for hap in two_cp_haps: - if "strcp1" not in hap: - counter_gene += 1 - else: - counter_pseudo += 1 + if counter_gene == 1 or counter_pseudo == 1: + two_cp_haps = self.compare_depth(haplotypes) + for hap in two_cp_haps: + if "strcp1" not in hap: + counter_gene += 1 + else: + counter_pseudo += 1 + if ( + intergenic_depth > 5 + and counter_gene == 1 + and counter_pseudo == 1 + and two_cp_haps == [] + ): + two_cp_haps = list(ass_haps.values()) + for hap in two_cp_haps: + if "strcp1" not in hap: + counter_gene += 1 + else: + counter_pseudo += 1 - total_cn = len(ass_haps) + len(two_cp_haps) - - # check depth between STRC and pseudogene - if self.mdepth is not None: - prob = self.depth_prob(int(intergenic_depth), self.mdepth / 2) - if prob[0] < 0.9 and counter_gene == 1: - counter_gene = None - total_cn = None - if prob[0] > 0.95 and counter_gene > 1 and two_cp_haps != []: - counter_gene = None - total_cn = None + total_cn = len(ass_haps) + len(two_cp_haps) + + # check depth between STRC and pseudogene + if self.mdepth is not None: + prob = self.depth_prob(int(intergenic_depth), self.mdepth / 2) + if prob[0] < 0.9 and counter_gene == 1: + counter_gene = None + total_cn = None + if prob[0] > 0.95 and counter_gene > 1 and counter_pseudo > 1: + counter_gene = None + total_cn = None + + # homozygous case + else: + total_cn = 2 + # both copies are pseudogene + if self.del1_reads_partial != set() or "43604720_G_A" in self.homo_sites: + counter_gene = 0 + else: + counter_gene = 2 self.close_handle() diff --git a/paraphase/genome_depth.py b/paraphase/genome_depth.py index 0989fbd..2ff6d3a 100755 --- a/paraphase/genome_depth.py +++ b/paraphase/genome_depth.py @@ -21,13 +21,11 @@ def get_genome_depth(self): at = line.split() nchr = at[0] pos1 = int(at[1]) - site_depth = 0 for pos in [pos1, pos1 + 1600]: - for pileupcolumn in self._bamh.pileup( - nchr, pos - 1, pos, truncate=True - ): - site_depth = pileupcolumn.get_num_aligned() - depth.append(site_depth) + site_depth = self._bamh.count( + nchr, pos - 1, pos, read_callback="all" + ) + depth.append(site_depth) self.mdepth = np.median(depth) self.mad = np.median([abs(a - self.mdepth) for a in depth]) / self.mdepth diff --git a/paraphase/phaser.py b/paraphase/phaser.py index bad990e..48aa4f5 100755 --- a/paraphase/phaser.py +++ b/paraphase/phaser.py @@ -10,6 +10,7 @@ import re import logging from scipy.stats import poisson +from collections import namedtuple from .haplotype_assembler import VariantGraph @@ -18,6 +19,15 @@ class Phaser: clip_5p = r"^\d+S|^\d+H" clip_3p = r"\d+S$|\d+H$" deletion = r"\d+D" + GeneCall = namedtuple( + "GeneCall", + "total_cn final_haplotypes two_copy_haplotypes \ + highest_total_cn assembled_haplotypes sites_for_phasing \ + unique_supporting_reads het_sites_not_used_in_phasing homozygous_sites \ + haplotype_details variant_genotypes nonunique_supporting_reads \ + read_details genome_depth", + ) + MEAN_BASE_QUAL = 25 def __init__(self, sample_id, outdir, wgs_depth=None, genome_bam=None): self.outdir = outdir @@ -69,11 +79,10 @@ def get_regional_depth(self, bam_handle, query_region, ninterval=100): depth = [] nstep = max(1, int((region[1] - region[0]) / ninterval)) for pos in range(region[0], region[1], nstep): - for pileupcolumn in bam_handle.pileup( - self.nchr, pos - 1, pos, truncate=True - ): - site_depth = pileupcolumn.get_num_aligned() - depth.append(site_depth) + site_depth = bam_handle.count( + self.nchr, pos - 1, pos, read_callback="all" + ) + depth.append(site_depth) region_depth.append(np.median(depth)) return region_depth @@ -209,7 +218,42 @@ def get_read_names(self, read, partial_deletion_reads): def get_haplotypes_from_reads( self, - het_sites, + exclude_reads=[], + min_mapq=5, + min_clip_len=50, + check_clip=False, + partial_deletion_reads=[], + kept_sites=[], + add_sites=[], + ): + """ + Go through reads and get bases at sites of interest. + Two rounds, with variant site filtering in between. + """ + raw_read_haps = self.get_haplotypes_from_reads_step( + exclude_reads, + min_mapq, + min_clip_len, + check_clip, + partial_deletion_reads, + ) + self.remove_var(raw_read_haps, kept_sites) + if self.het_sites != []: + for var in add_sites: + if var not in self.het_sites: + self.het_sites.append(var) + self.het_sites = sorted(self.het_sites) + raw_read_haps = self.get_haplotypes_from_reads_step( + exclude_reads, + min_mapq, + min_clip_len, + check_clip, + partial_deletion_reads, + ) + return raw_read_haps + + def get_haplotypes_from_reads_step( + self, exclude_reads=[], min_mapq=5, min_clip_len=50, @@ -222,41 +266,55 @@ def get_haplotypes_from_reads( read_haps (dict of str:list): collapse each read into just the positions of interest. 1 corresponds to ref, 2 corresponds to alt """ + het_sites = self.het_sites read_haps = {} nvar = len(het_sites) for dsnp_index, allele_site in enumerate(het_sites): snp_position_gene1, allele1, allele2, *at = allele_site.split("_") snp_position = int(snp_position_gene1) + reads_with_flanking_indels = [] for pileupcolumn in self._bamh.pileup( self.nchr, - snp_position - 1, + snp_position - 2, snp_position, truncate=True, - min_base_quality=29, + min_base_quality=self.MEAN_BASE_QUAL, ): - for read in pileupcolumn.pileups: - read_names = self.get_read_names( - read.alignment, partial_deletion_reads - ) - for read_name in read_names: - if ( - not read.is_del - and not read.is_refskip - and not read.alignment.is_secondary - and read.alignment.mapping_quality >= min_mapq - and read_name not in exclude_reads - ): - read_seq = read.alignment.query_sequence - start_pos = read.query_position - end_pos = start_pos + 1 - if end_pos < len(read_seq): - hap = read_seq[start_pos:end_pos] - if read_name not in read_haps: - read_haps.setdefault(read_name, ["x"] * nvar) - if hap.upper() == allele1.upper(): - read_haps[read_name][dsnp_index] = "1" - elif hap.upper() == allele2.upper(): - read_haps[read_name][dsnp_index] = "2" + # require that the base on the read is not flanked by any indels + if pileupcolumn.reference_pos == snp_position - 2: + for read in pileupcolumn.pileups: + if read.indel != 0 or read.is_del: + read_names = self.get_read_names( + read.alignment, partial_deletion_reads + ) + for read_name in read_names: + reads_with_flanking_indels.append(read_name) + if pileupcolumn.reference_pos == snp_position - 1: + for read in pileupcolumn.pileups: + read_names = self.get_read_names( + read.alignment, partial_deletion_reads + ) + for read_name in read_names: + if ( + not read.is_del + and not read.is_refskip + and not read.alignment.is_secondary + and read.alignment.mapping_quality >= min_mapq + and read_name not in exclude_reads + and read.indel == 0 + and read_name not in reads_with_flanking_indels + ): + read_seq = read.alignment.query_sequence + start_pos = read.query_position + end_pos = start_pos + 1 + if end_pos < len(read_seq): + hap = read_seq[start_pos:end_pos] + if read_name not in read_haps: + read_haps.setdefault(read_name, ["x"] * nvar) + if hap.upper() == allele1.upper(): + read_haps[read_name][dsnp_index] = "1" + elif hap.upper() == allele2.upper(): + read_haps[read_name][dsnp_index] = "2" # for softclips starting at a predefined position, mark sites as 0 instead of x if check_clip: @@ -269,34 +327,59 @@ def get_haplotypes_from_reads( self.nchr, clip_position - 10, clip_position + 10 ): read_name = self.get_read_name(read) - if read_name in read_haps: - if abs(read.reference_end - clip_position) < 20: - find_clip_3p = re.findall( - self.clip_3p, read.cigarstring - ) - if ( - find_clip_3p != [] - and int(find_clip_3p[0][:-1]) >= min_clip_len - ): - read_haps[read_name][dsnp_index] = "0" + if read_name not in read_haps: + read_haps.setdefault(read_name, ["x"] * nvar) + if abs(read.reference_end - clip_position) < 20: + find_clip_3p = re.findall( + self.clip_3p, read.cigarstring + ) + if ( + find_clip_3p != [] + and int(find_clip_3p[0][:-1]) >= min_clip_len + ): + read_haps[read_name][dsnp_index] = "0" for clip_position in sorted(self.clip_5p_positions, reverse=True): if snp_position < clip_position: for read in self._bamh.fetch( self.nchr, clip_position - 10, clip_position + 10 ): read_name = self.get_read_name(read) - if read_name in read_haps: - if abs(read.reference_start - clip_position) < 20: - find_clip_5p = re.findall( - self.clip_5p, read.cigarstring - ) - if ( - find_clip_5p != [] - and int(find_clip_5p[0][:-1]) >= min_clip_len - ): - read_haps[read_name][dsnp_index] = "0" + if read_name not in read_haps: + read_haps.setdefault(read_name, ["x"] * nvar) + if abs(read.reference_start - clip_position) < 20: + find_clip_5p = re.findall( + self.clip_5p, read.cigarstring + ) + if ( + find_clip_5p != [] + and int(find_clip_5p[0][:-1]) >= min_clip_len + ): + read_haps[read_name][dsnp_index] = "0" return read_haps + def remove_var(self, raw_read_haps, kept_sites): + """remove variants that are not present after checking each read-haplotype""" + bases_per_site = {} + sites_to_remove = [] + for i in range(len(self.het_sites)): + for read, hap in raw_read_haps.items(): + base = hap[i] + bases_per_site.setdefault(i, []).append(base) + + for pos in bases_per_site: + bases = bases_per_site[pos] + bases_x = bases.count("x") + bases_ref = bases.count("1") + bases_alt = bases.count("2") + this_var = self.het_sites[pos] + if bases_x == len(bases): + sites_to_remove.append(this_var) + if bases_ref + bases_alt == len(bases) - bases_x and bases_alt <= 3: + if this_var not in kept_sites: + sites_to_remove.append(this_var) + for var in sites_to_remove: + self.het_sites.remove(var) + def allow_del_bases(self, pos): return False @@ -343,53 +426,22 @@ def get_candidate_pos(self, regions_to_check=[], min_read_support=5, min_vaf=0.1 del_bases_count = all_bases.count("*") # get reference base offset_pos = pos - self.offset - ref_seq = self._refh.fetch(self.nchr_old, offset_pos - 1, offset_pos) + ref_seq_genome = self._refh.fetch(self.nchr_old, offset_pos - 1, offset_pos) if total_depth >= min_read_support and ( del_bases_count < min_read_support or self.allow_del_bases(pos) ): all_bases = [a for a in all_bases if a != "*"] counter = Counter(all_bases) - bases = counter.most_common(2) - if ( - len(counter) >= 2 - and bases[1][1] >= min_read_support - and bases[1][1] / total_depth > min_vaf - ): - var_seq = None - found_ref = ref_seq in [a[0] for a in bases] - for base in bases: - if base[0] != ref_seq: - var_seq = base[0] - break - if found_ref is True and var_seq is not None: - # SNV - if "-" not in var_seq and "+" not in var_seq: - if pos not in self.homopolymer_sites: - variants.setdefault(pos, (ref_seq, var_seq)) - else: - prohibited_bases = self.homopolymer_sites[pos].split( - "," - ) - if var_seq not in prohibited_bases: - if "1" in prohibited_bases: - variants.setdefault(pos, (ref_seq, var_seq)) - else: - variants_no_phasing.setdefault( - pos, (ref_seq, var_seq) - ) - # indels - elif pos not in self.homopolymer_sites: - ref_seq, var_seq, indel_size = self.process_indel( - pos, ref_seq, var_seq - ) - if indel_size < 25: - variants_no_phasing.setdefault(pos, (ref_seq, var_seq)) - elif len(counter) == 1 or ( + # include multi-allelic sites + bases = counter.most_common(3) + # homozygous + if len(counter) == 1 or ( len(counter) >= 2 and bases[0][1] > len(all_bases) - min_read_support ): var_seq = bases[0][0] + ref_seq = ref_seq_genome if var_seq != ref_seq: # SNV and indels if "-" not in var_seq and "+" not in var_seq: @@ -399,7 +451,7 @@ def get_candidate_pos(self, regions_to_check=[], min_read_support=5, min_vaf=0.1 and del_bases_count >= min_read_support and pos not in self.homopolymer_sites ): - variants.setdefault(pos, (ref_seq, var_seq)) + variants.setdefault(pos, []).append((ref_seq, var_seq)) elif pos not in self.homopolymer_sites or ( pos in self.homopolymer_sites and var_seq @@ -412,14 +464,54 @@ def get_candidate_pos(self, regions_to_check=[], min_read_support=5, min_vaf=0.1 ) if indel_size < 25: self.homo_sites.append(f"{pos}_{ref_seq}_{var_seq}") + elif len(counter) >= 2: + found_ref = ref_seq_genome in [a[0] for a in bases] + if found_ref: + for var_seq, var_count in bases: + ref_seq = ref_seq_genome + if ( + var_seq != ref_seq + and var_count >= min_read_support + and var_count / total_depth > min_vaf + ): + # SNV + if "-" not in var_seq and "+" not in var_seq: + if pos not in self.homopolymer_sites: + variants.setdefault(pos, []).append( + (ref_seq, var_seq) + ) + else: + prohibited_bases = self.homopolymer_sites[ + pos + ].split(",") + if var_seq not in prohibited_bases: + if "1" in prohibited_bases: + variants.setdefault(pos, []).append( + (ref_seq, var_seq) + ) + else: + variants_no_phasing.setdefault( + pos, (ref_seq, var_seq) + ) + # indels + elif pos not in self.homopolymer_sites: + ref_seq, var_seq, indel_size = self.process_indel( + pos, ref_seq, var_seq + ) + if indel_size < 25: + variants_no_phasing.setdefault( + pos, (ref_seq, var_seq) + ) + # exclude variants caused by shifted softclips of the big deletions excluded_variants = [] for region in regions_to_check: var_to_check = [a for a in variants if region[0] < a < region[1]] excluded_variants += var_to_check for pos in variants: - if pos not in excluded_variants: - ref_seq, var_seq = variants[pos] + # for now, filter out multi-allelic sites + if pos not in excluded_variants and len(variants[pos]) == 1: + ref_seq, var_seq = variants[pos][0] self.candidate_pos.add(f"{pos}_{ref_seq}_{var_seq}") excluded_variants = [] @@ -648,9 +740,9 @@ def update_reads_for_deletions( ): hap[pos1] = "0" else: - flanking_left = hap[min(0, pos1 - 2) : pos1] + flanking_left = hap[max(0, pos1 - 2) : pos1] flanking_right = hap[ - max(pos1 + 1, len(hap)) : max(pos1 + 3, len(hap)) + min(pos1 + 1, len(hap)) : min(pos1 + 3, len(hap)) ] if "x" not in flanking_left and "x" not in flanking_right: hap[pos1] = "1" @@ -699,7 +791,7 @@ def get_read_counts(self, uniquely_supporting_haps): read_count.setdefault(hap, len(lreads)) return read_count - def phase_haps(self, raw_read_haps, debug=False): + def phase_haps(self, raw_read_haps, min_support=4, debug=False): """ Assemble and evaluate haplotypes """ @@ -722,8 +814,45 @@ def phase_haps(self, raw_read_haps, debug=False): ) ass_haps, original_haps, hcn = hap_graph.run(debug=debug, make_plot=debug) - read_support = VariantGraph.match_reads_and_haplotypes(raw_read_haps, ass_haps) + ( + uniquely_supporting_reads, + nonuniquely_supporting_reads, + read_counts, + ) = self.get_read_support(raw_read_haps, haplotypes_to_reads, ass_haps) + + # remove spurious ones + ass_haps = self.adjust_spurious_haplotypes(uniquely_supporting_reads) + ( + uniquely_supporting_reads, + nonuniquely_supporting_reads, + read_counts, + ) = self.get_read_support(raw_read_haps, haplotypes_to_reads, ass_haps) + + # remove low-support ones + ass_haps = [ + a + for a in uniquely_supporting_reads + if len(uniquely_supporting_reads[a]) >= min_support + ] + ( + uniquely_supporting_reads, + nonuniquely_supporting_reads, + read_counts, + ) = self.get_read_support(raw_read_haps, haplotypes_to_reads, ass_haps) + return ( + ass_haps, + original_haps, + hcn, + uniquely_supporting_reads, + nonuniquely_supporting_reads, + raw_read_haps, + read_counts, + ) + + def get_read_support(self, raw_read_haps, haplotypes_to_reads, ass_haps): + """Find uniquely and nonuniquely supporting reads for given haplotypes""" + read_support = VariantGraph.match_reads_and_haplotypes(raw_read_haps, ass_haps) uniquely_supporting_haps = read_support.unique read_counts = self.get_read_counts(uniquely_supporting_haps) @@ -744,12 +873,8 @@ def phase_haps(self, raw_read_haps, debug=False): read, read_support.by_read[read] ) return ( - ass_haps, - original_haps, - hcn, uniquely_supporting_reads, nonuniquely_supporting_reads, - raw_read_haps, read_counts, ) @@ -796,7 +921,11 @@ def compare_depth(self, haplotypes, loose=False): for pos in sites: hap_base = sites[pos] for pileupcolumn in bamh.pileup( - self.nchr, pos - 1, pos, truncate=True, min_base_quality=29 + self.nchr, + pos - 1, + pos, + truncate=True, + min_base_quality=self.MEAN_BASE_QUAL, ): bases = [a.upper() for a in pileupcolumn.get_query_sequences()] base_num = bases.count(hap_base) @@ -815,6 +944,135 @@ def compare_depth(self, haplotypes, loose=False): return two_cp_haps + def adjust_spurious_haplotypes(self, uniquely_supporting_reads, flanking_bp=10): + """Identify spurious haplotypes caused by locally misaligned reads""" + passing_haplotypes = list(uniquely_supporting_reads.keys()) + suspicious_hap_pair = [] + lhap = uniquely_supporting_reads.keys() + for hap1 in lhap: + for hap2 in lhap: + if hap1 != hap2: + nmatch = 0 + nmismatch = 0 + mismatch_sites = [] + for i, base1 in enumerate(hap1): + base2 = hap2[i] + if "x" not in [base1, base2]: + if base1 == base2: + nmatch += 1 + elif base1 in ["1", "2"] and base2 in ["1", "2"]: + nmismatch += 1 + mismatch_sites.append(self.het_sites[i]) + if nmatch >= 5 and nmismatch == 1 and len(mismatch_sites) == 1: + mismatch_pos = int(mismatch_sites[0].split("_")[0]) + hap1_reads = uniquely_supporting_reads[hap1] + hap2_reads = uniquely_supporting_reads[hap2] + hap_pair = None + if len(hap1_reads) <= 5 and len(hap2_reads) >= 6: + hap_pair = [hap2, hap1] + elif len(hap2_reads) <= 5 and len(hap1_reads) >= 6: + hap_pair = [hap1, hap2] + if ( + hap_pair is not None + and [ + hap_pair, + mismatch_pos, + ] + not in suspicious_hap_pair + ): + suspicious_hap_pair.append([hap_pair, mismatch_pos]) + + for hap_pair, mismatch_pos in suspicious_hap_pair: + hap1, hap2 = hap_pair + hap1_reads = uniquely_supporting_reads[hap1] + hap2_reads = uniquely_supporting_reads[hap2] + hap1_reads_at_pos = [] + hap2_reads_at_pos = [] + for pileupcolumn in self._bamh.pileup( + self.nchr, + mismatch_pos - 1, + mismatch_pos, + truncate=True, + min_base_quality=self.MEAN_BASE_QUAL, + ): + for read in pileupcolumn.pileups: + if not read.is_del and not read.is_refskip: + read_name = read.alignment.query_name + read_seq = read.alignment.query_sequence + read_pos = read.query_position + if ( + read_name in hap1_reads + hap2_reads + and read_pos >= flanking_bp + and read_pos + flanking_bp < len(read_seq) + ): + start_pos = read_pos - flanking_bp + end_pos = read_pos + flanking_bp + if read_name in hap1_reads: + hap1_reads_at_pos.append(read_seq[start_pos:end_pos]) + if read_name in hap2_reads: + hap2_reads_at_pos.append(read_seq[start_pos:end_pos]) + + if set(hap1_reads_at_pos).intersection(set(hap2_reads_at_pos)) != set(): + passing_haplotypes.remove(hap2) + return passing_haplotypes + + def call(self): + """Main function to phase haplotypes and call copy numbers""" + if self.check_coverage_before_analysis() is False: + return None + self.get_homopolymer() + self.get_candidate_pos() + self.het_sites = sorted(list(self.candidate_pos)) + self.remove_noisy_sites() + + raw_read_haps = self.get_haplotypes_from_reads() + + ( + ass_haps, + original_haps, + hcn, + uniquely_supporting_reads, + nonuniquely_supporting_reads, + raw_read_haps, + read_counts, + ) = self.phase_haps(raw_read_haps) + + tmp = {} + for i, hap in enumerate(ass_haps): + tmp.setdefault(hap, f"hap{i+1}") + ass_haps = tmp + + haplotypes = None + dvar = None + if self.het_sites != []: + haplotypes, dvar = self.output_variants_in_haplotypes( + ass_haps, + uniquely_supporting_reads, + nonuniquely_supporting_reads, + ) + + two_cp_haps = self.compare_depth(haplotypes) + total_cn = len(ass_haps) + len(two_cp_haps) + + self.close_handle() + + return self.GeneCall( + total_cn, + ass_haps, + two_cp_haps, + hcn, + original_haps, + self.het_sites, + uniquely_supporting_reads, + self.het_no_phasing, + self.homo_sites, + haplotypes, + dvar, + nonuniquely_supporting_reads, + raw_read_haps, + self.mdepth, + ) + def close_handle(self): self._bamh.close() self._refh.close() diff --git a/paraphase/prepare_bam_and_vcf.py b/paraphase/prepare_bam_and_vcf.py index 32e2ef0..af8164d 100755 --- a/paraphase/prepare_bam_and_vcf.py +++ b/paraphase/prepare_bam_and_vcf.py @@ -388,9 +388,9 @@ def get_var(all_bases, ref_seq): var_seq = most_common_base[0][0] ad = most_common_base[0][1] if ( - dp >= 3 - and ad >= 2 - and (len(most_common_base) == 1 or ad > most_common_base[1][1]) + len(var_seq) == 1 and len(ref_seq) == 1 and dp >= 3 and ad > dp * 0.5 + ) or ( + (len(var_seq) > 1 or len(ref_seq) > 1) and dp >= 5 and ad >= dp * 0.7 ): if var_seq == ref_seq or var_seq == "*": gt = "0" @@ -557,12 +557,18 @@ def pileup_to_variant( refh_pos = pos ref_seq = refh.fetch(ref_name, refh_pos - 1, refh_pos) alt_all_reads = self.get_var(all_bases, ref_seq) - if None not in hap_bound and hap_bound[0] < true_pos < hap_bound[1]: + if hap_bound == [] or ( + None not in hap_bound and hap_bound[0] < true_pos < hap_bound[1] + ): # use only unique reads for positions at the edge - if true_pos < hap_bound[2] or true_pos > hap_bound[3]: + if ( + hap_bound == [] + or true_pos < hap_bound[2] + or true_pos > hap_bound[3] + ): bases_uniq_reads = [] for i, read_base in enumerate(all_bases): - if read_names[pos][i] in uniq_reads: + if uniq_reads is None or read_names[pos][i] in uniq_reads: bases_uniq_reads.append(read_base) alt_uniq_reads = self.get_var(bases_uniq_reads, ref_seq) if alt_uniq_reads[-1] != ".": @@ -623,6 +629,41 @@ def run_without_realign(self): bamh = pysam.AlignmentFile(self.bam, "rb") refh = pysam.FastaFile(self.ref) + if final_haps == {}: + hap_name = "homozygous_hap1" + hap_vcf_out = os.path.join( + self.vcf_dir, self.sample_id + f"_{self.gene}_{hap_name}.vcf" + ) + vcf_out = open(hap_vcf_out, "w") + self.write_header(vcf_out) + pileups_raw = {} + read_names = {} + for pileupcolumn in bamh.pileup( + self.nchr, + truncate=True, + min_base_quality=30, + ): + pos = pileupcolumn.pos + 1 + this_pos_bases = [ + a.upper() for a in pileupcolumn.get_query_sequences(add_indels=True) + ] + pileups_raw.setdefault(pos, this_pos_bases) + read_names.setdefault(pos, pileupcolumn.get_query_names()) + variants_called = self.pileup_to_variant( + pileups_raw, + read_names, + None, + refh, + 0 - self.offset, + [], + vcf_out, + ) + vcf_out.close() + for pos, var_name, dp, ad, qual, gt in variants_called: + vars.setdefault( + pos, [[var_name, dp, ad, qual, gt], [var_name, dp, ad, qual, gt]] + ) + i = 0 for hap_name in final_haps.values(): hap_bound = self.get_hap_bound(hap_name) diff --git a/setup.py b/setup.py index 094a8c6..16bd1ca 100644 --- a/setup.py +++ b/setup.py @@ -8,7 +8,7 @@ def readme(): setup( name="paraphase", - version="2.0.0", + version="2.1.0", description="paraphase: HiFi-based caller for highly homologous genes", long_description=readme(), url="https://github.com/PacificBiosciences/paraphase",