From 99954572947803f57b73b09bea7c6652b38b9065 Mon Sep 17 00:00:00 2001 From: Joe Zhu Date: Mon, 20 Nov 2017 01:10:18 +0000 Subject: [PATCH] bwd seems to work now --- Makefile.am | 19 +++--- src/ibd.cpp | 42 ++++++++---- src/panel.hpp | 5 ++ tests/unittest/test_ibd.cpp | 127 +++++++++++++++++++++++++----------- 4 files changed, 135 insertions(+), 58 deletions(-) diff --git a/Makefile.am b/Makefile.am index 915e21f4..046eab57 100644 --- a/Makefile.am +++ b/Makefile.am @@ -51,15 +51,16 @@ dEploid_prof_LDADD = $(common_LDADD) unit_tests_SOURCES = $(common_src) \ tests/unittest/test_runner.cpp \ - tests/unittest/test_updateSingleHap.cpp \ - tests/unittest/test_utilities.cpp \ - tests/unittest/test_ibd.cpp \ - tests/unittest/test_panel.cpp \ - tests/unittest/test_txtReader.cpp \ - tests/unittest/test_dEploidIO.cpp \ - tests/unittest/test_mcmc.cpp \ - tests/unittest/test_updatePairHap.cpp \ - tests/unittest/test_vcfReader.cpp + tests/unittest/test_ibd.cpp + +# tests/unittest/test_updateSingleHap.cpp \ +# tests/unittest/test_utilities.cpp \ +# tests/unittest/test_panel.cpp \ +# tests/unittest/test_txtReader.cpp \ +# tests/unittest/test_dEploidIO.cpp \ +# tests/unittest/test_mcmc.cpp \ +# tests/unittest/test_updatePairHap.cpp \ +# tests/unittest/test_vcfReader.cpp unit_tests_CXXFLAGS = $(common_flags) -DNDEBUG -DUNITTEST -Wno-write-strings --coverage unit_tests_LDADD = -lcppunit -ldl $(common_LDADD) diff --git a/src/ibd.cpp b/src/ibd.cpp index 9ee9189f..eb579f81 100644 --- a/src/ibd.cpp +++ b/src/ibd.cpp @@ -332,9 +332,9 @@ bool twoVectorsAreSame(vector vec1, vector vec2){ } - IBDpath::IBDpath(){}; + void IBDpath::init(DEploidIO &dEploidIO, RandomGenerator* rg){ this->ibdRg_ = rg; this->setNLoci(dEploidIO.nLoci()); @@ -408,7 +408,8 @@ vector IBDpath::findWhichIsSomething(vector tmpOp, size_t some void IBDpath::buildPathProbabilityForPainting(vector proportion){ - vector effectiveKPrior = this->computeEffectiveKPrior(this->theta()); + //vector effectiveKPrior = this->computeEffectiveKPrior(this->theta()); + vector effectiveKPrior = vector (this->hprior.nPattern(), 1.0/this->hprior.nPattern()); vector statePrior = this->computeStatePrior(effectiveKPrior); // First building the path likelihood this->computeIbdPathFwdProb(proportion, statePrior); @@ -424,6 +425,7 @@ void IBDpath::computeIbdPathBwdProb(vector proportion, vector //tmpBw = (a.prior * 1/table(state.idx)) %*% tij //bwd[,n.loci] = tmpBw/sum(tmpBw) + cout << " start building ibd bwd "<< endl; vector tmp = vector (hprior.stateIdxFreq.size()); assert(effectiveKPrior.size() == hprior.stateIdxFreq.size()); for (size_t i = 0; i < tmp.size(); i++){ @@ -438,18 +440,23 @@ void IBDpath::computeIbdPathBwdProb(vector proportion, vector } this->bwd.push_back(tmpBw); - for ( size_t rev_siteI = 1; rev_siteI < this->nLoci(); rev_siteI++ ){ size_t siteI = this->nLoci()-rev_siteI; + vector lk = computeLlkOfStatesAtSiteI(proportion, siteI); +//vector lk = vector (hprior.nState(), 1.0); + cout << "lk = " ; for (double l :lk){cout << l << " ";}cout< bSumState = vector (hprior.nState()); +cout <<"bsumstate = "; + vector bSumState = vector (hprior.nPattern()); for ( size_t i = 0; i < bSumState.size(); i++){ for ( size_t j = 0; j < hprior.nState(); j++ ){ bSumState[i] += ibdTransProbs[i][j]*this->bwd.back()[j]; } +cout<<" "< vNoRecomb(hprior.nState()); for (size_t i = 0; i < hprior.stateIdx.size(); i++ ){ vNoRecomb[i] = bSumState[hprior.stateIdx[i]]; @@ -458,16 +465,19 @@ void IBDpath::computeIbdPathBwdProb(vector proportion, vector for (size_t i = 0; i < hprior.nState(); i++ ){ tmpBw[i] = 0; for (size_t j = 0; j < lk.size(); j++){ - tmpBw[i] += (lk[j] * bwd.back()[j]); + tmpBw[i] += (lk[j] * bwd.back()[j])*this->ibdRecombProbs.pRec_[siteI-1]; } - tmpBw[i] *= this->ibdRecombProbs.pRec_[siteI] * statePrior[i]; - tmpBw[i] += lk[i] * (1-this->ibdRecombProbs.pRec_[siteI]) * vNoRecomb[i]; + cout<< tmpBw[i] << ", "; + tmpBw[i] *= statePrior[i]; + cout<< tmpBw[i] << ", "; + tmpBw[i] += lk[i] * (this->ibdRecombProbs.pNoRec_[siteI-1]) * vNoRecomb[i]; + cout<< tmpBw[i] << "\n"; tmpBw[i] *= hprior.priorProb[i][siteI]; } normalizeBySum(tmpBw); this->bwd.push_back(tmpBw); + cout< proportion, vector } lk = computeLlkOfStatesAtSiteI(proportion, siteI); + //cout << "lk = " ; for (double l :lk){cout << l << " ";}cout<updateFmAtSiteI(vPrior, lk); } } @@ -535,12 +546,18 @@ void IBDpath::updateFmAtSiteI(vector & prior, vector & llk){ void IBDpath::combineFwdBwd(){ for (size_t i = 0; i < nLoci(); i++ ){ normalizeBySum(fm[i]); + //normalizeBySum(bwd[i]); vector tmp; + cout << " site " << i << endl; for (size_t j = 0; j < fm[i].size(); j++){ - tmp.push_back(exp(log(fm[i][j])+log(bwd[i][j]))); + + //tmp.push_back(exp(log(fm[i][j])+log(bwd[i][j]))); + //tmp.push_back(exp(log(fm[i][j]))); + tmp.push_back(exp(log(fm[i][j]))); + //cout << "fwd = "<::min(); + //cout << normalized< pRec_; vector < double > pNoRec_; // = 1.0 - pRec; diff --git a/tests/unittest/test_ibd.cpp b/tests/unittest/test_ibd.cpp index 53958acd..db796241 100644 --- a/tests/unittest/test_ibd.cpp +++ b/tests/unittest/test_ibd.cpp @@ -233,11 +233,15 @@ class TestIBDpath : public CppUnit::TestCase { CPPUNIT_TEST( testIbdTransProbs ); CPPUNIT_TEST( testComputeUniqueEffectiveKCount ); CPPUNIT_TEST( testIBDconfigureHeader ); + CPPUNIT_TEST( testStatePrior ); + //CPPUNIT_TEST( checkFwd ); + CPPUNIT_TEST( checkBwd ); CPPUNIT_TEST_SUITE_END(); private: - IBDpath* ibdPath_; IBDpath* ibdPath2_; + IBDpath* ibdPath3_; + IBDpath* ibdPath5_; DEploidIO* dEploidIO_; MersenneTwister* rg_; double epsilon2; @@ -250,31 +254,40 @@ class TestIBDpath : public CppUnit::TestCase { dEploidIO_->setKstrain(3); dEploidIO_->plaf_ = vector ({0.1, .4, .4, .3, .2, .5}); vector < vector > testPosition; - testPosition.push_back(vector ({200, 3000})); - testPosition.push_back(vector ({300})); - testPosition.push_back(vector ({300, 400, 500})); + testPosition.push_back(vector ({1,2,3,4,5,6})); + //testPosition.push_back(vector ({200, 3000})); + //testPosition.push_back(vector ({300})); + //testPosition.push_back(vector ({300, 400, 500})); dEploidIO_->position_ = testPosition; dEploidIO_->nLoci_ = 6; - dEploidIO_->chrom_ = vector ({"chrom1", "chrom2"}); + //dEploidIO_->chrom_ = vector ({"chrom1", "chrom2", "chrom3"}); + dEploidIO_->chrom_ = vector ({"chrom1"}); + dEploidIO_->useConstRecomb_ = true; + dEploidIO_->constRecombProb_ = 0.000001; rg_ = new MersenneTwister(dEploidIO_->randomSeed()); epsilon2 = 0.001; - ibdPath_ = new IBDpath; - this->ibdPath_->init(*dEploidIO_, rg_); + ibdPath3_ = new IBDpath; + this->ibdPath3_->init(*dEploidIO_, rg_); dEploidIO_->setKstrain(5); + ibdPath5_ = new IBDpath; + this->ibdPath5_->init(*dEploidIO_, rg_); + dEploidIO_->setKstrain(2); ibdPath2_ = new IBDpath; this->ibdPath2_->init(*dEploidIO_, rg_); } void tearDown() { - delete ibdPath_; delete ibdPath2_; + delete ibdPath3_; + delete ibdPath5_; delete rg_; delete dEploidIO_; } void testMainConstructor(){ - + for (double p : ibdPath2_->ibdRecombProbs.pRec_){cout <ibdRecombProbs.pRec_){cout <ibdPath_->llkSurf.size(), (size_t)6 ); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.149687, this->ibdPath_->llkSurf[0][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 62.602446, this->ibdPath_->llkSurf[0][1], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 62.602446, this->ibdPath_->llkSurf[1][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.149687, this->ibdPath_->llkSurf[1][1], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 50.250071, this->ibdPath_->llkSurf[2][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 1.507423, this->ibdPath_->llkSurf[2][1], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 24.735000, this->ibdPath_->llkSurf[3][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 24.735000, this->ibdPath_->llkSurf[3][1], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.968471, this->ibdPath_->llkSurf[4][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 1.029853, this->ibdPath_->llkSurf[4][1], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.800135, this->ibdPath_->llkSurf[5][0], epsilon2); - CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.800135, this->ibdPath_->llkSurf[5][1], epsilon2); + CPPUNIT_ASSERT_EQUAL( this->ibdPath3_->llkSurf.size(), (size_t)6 ); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.149687, this->ibdPath3_->llkSurf[0][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 62.602446, this->ibdPath3_->llkSurf[0][1], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 62.602446, this->ibdPath3_->llkSurf[1][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.149687, this->ibdPath3_->llkSurf[1][1], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 50.250071, this->ibdPath3_->llkSurf[2][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 1.507423, this->ibdPath3_->llkSurf[2][1], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 24.735000, this->ibdPath3_->llkSurf[3][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 24.735000, this->ibdPath3_->llkSurf[3][1], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.968471, this->ibdPath3_->llkSurf[4][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 1.029853, this->ibdPath3_->llkSurf[4][1], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.800135, this->ibdPath3_->llkSurf[5][0], epsilon2); + CPPUNIT_ASSERT_DOUBLES_EQUAL ( 2.800135, this->ibdPath3_->llkSurf[5][1], epsilon2); } @@ -319,38 +332,38 @@ class TestIBDpath : public CppUnit::TestCase { //[4,] 0 0 1 1 1 1 0 0 //[5,] 0 0 0 0 0 0 1 1 //vector tmpPlaf = vector ({0.1, 0.2, 0.3}); - //CPPUNIT_ASSERT_NO_THROW(this->ibdPath_->hprior.buildHprior(3, tmpPlaf)); - CPPUNIT_ASSERT_EQUAL(this->ibdPath_->hprior.nPattern(), (size_t)5); - CPPUNIT_ASSERT_EQUAL(this->ibdPath_->hprior.nState(), (size_t)22); + //CPPUNIT_ASSERT_NO_THROW(this->ibdPath3_->hprior.buildHprior(3, tmpPlaf)); + CPPUNIT_ASSERT_EQUAL(this->ibdPath3_->hprior.nPattern(), (size_t)5); + CPPUNIT_ASSERT_EQUAL(this->ibdPath3_->hprior.nState(), (size_t)22); - //CPPUNIT_ASSERT_NO_THROW(this->ibdPath_->makeIbdTransProbs()); - CPPUNIT_ASSERT_EQUAL((size_t)5, this->ibdPath_->ibdTransProbs.size()); - double tmpValue = sumOfMat(this->ibdPath_->ibdTransProbs); + //CPPUNIT_ASSERT_NO_THROW(this->ibdPath3_->makeIbdTransProbs()); + CPPUNIT_ASSERT_EQUAL((size_t)5, this->ibdPath3_->ibdTransProbs.size()); + double tmpValue = sumOfMat(this->ibdPath3_->ibdTransProbs); CPPUNIT_ASSERT_EQUAL((double)22.0, tmpValue); for ( size_t i = 0; i < 22; i++){ - CPPUNIT_ASSERT_EQUAL(this->ibdPath_->ibdTransProbs[this->ibdPath_->hprior.stateIdx[i]][i], (double)1.0); + CPPUNIT_ASSERT_EQUAL(this->ibdPath3_->ibdTransProbs[this->ibdPath3_->hprior.stateIdx[i]][i], (double)1.0); } } void testComputeUniqueEffectiveKCount(){ //vector tmpPlaf = vector ({0.1, 0.2, 0.3}); - //CPPUNIT_ASSERT_NO_THROW(this->ibdPath_->hprior.buildHprior(5, tmpPlaf)); - CPPUNIT_ASSERT_NO_THROW(this->ibdPath2_->computeUniqueEffectiveKCount()); - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount.size(), (size_t)5); + //CPPUNIT_ASSERT_NO_THROW(this->ibdPath3_->hprior.buildHprior(5, tmpPlaf)); + CPPUNIT_ASSERT_NO_THROW(this->ibdPath5_->computeUniqueEffectiveKCount()); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount.size(), (size_t)5); //> table(make.ibd.mat.joe(5)$k.eff) //1 2 3 4 5 //1 15 25 10 1 - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount[0], (int)1); - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount[1], (int)15); - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount[2], (int)25); - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount[3], (int)10); - CPPUNIT_ASSERT_EQUAL(this->ibdPath2_->uniqueEffectiveKCount[4], (int)1); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount[0], (int)1); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount[1], (int)15); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount[2], (int)25); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount[3], (int)10); + CPPUNIT_ASSERT_EQUAL(this->ibdPath5_->uniqueEffectiveKCount[4], (int)1); } void testIBDconfigureHeader(){ - vector headerOf3Strain = this->ibdPath_->getIBDprobsHeader(); + vector headerOf3Strain = this->ibdPath3_->getIBDprobsHeader(); CPPUNIT_ASSERT_EQUAL((size_t)5, headerOf3Strain.size()); CPPUNIT_ASSERT("0-1-2" == headerOf3Strain[0]); CPPUNIT_ASSERT("0-2-2" == headerOf3Strain[1]); @@ -358,6 +371,44 @@ class TestIBDpath : public CppUnit::TestCase { CPPUNIT_ASSERT("2-2-2" == headerOf3Strain[3]); CPPUNIT_ASSERT("1-1-2" == headerOf3Strain[4]); } + + + void testStatePrior(){ + //vector effectiveKPrior = this->ibdPath3_->computeEffectiveKPrior(this->ibdPath3_->theta()); + vector effectiveKPrior = vector (this->ibdPath3_->hprior.nPattern(), 1.0/this->ibdPath3_->hprior.nPattern()); + //for (double p : effectiveKPrior){cout< statePrior = this->ibdPath3_->computeStatePrior(effectiveKPrior); + //for (double p : statePrior){cout< effectiveKPrior = vector (this->ibdPath3_->hprior.nPattern(), 1.0/this->ibdPath3_->hprior.nPattern()); + //for (double p : effectiveKPrior){cout< statePrior = this->ibdPath3_->computeStatePrior(effectiveKPrior); + this->ibdPath3_->computeIbdPathFwdProb(vector ({.5, .25, .25}), statePrior); + vector tmp =this->ibdPath3_->fm[5]; + normalizeBySum(tmp); + for (double p:tmp) printf("%8.2f\n", p); + } + + void checkBwd(){ + vector effectiveKPrior = vector (this->ibdPath2_->hprior.nPattern(), 1.0/this->ibdPath2_->hprior.nPattern()); + //for (double p : effectiveKPrior){cout< statePrior = this->ibdPath2_->computeStatePrior(effectiveKPrior); + this->ibdPath2_->computeIbdPathBwdProb(vector ({.5, .5}), effectiveKPrior, statePrior); + for (size_t i = 0; i < 6; i++){ + vector tmp =this->ibdPath2_->bwd[i]; + normalizeBySum(tmp); + } + for (size_t i = 0; i < 6; i++){ + for (size_t j = 0; j < 5; j++){ + printf("%8.3f ", this->ibdPath2_->bwd[j][i]); + } + cout << endl; + //for (double p:tmp) printf("%8.3f\n", p); + } + } + }; CPPUNIT_TEST_SUITE_REGISTRATION(TestIBDUtility);