00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
00044
00045
00046
00047
00048
00049
00050
00051
00052
00053
00054
00055
00056
00057
00058
00059
00060
00061
00062
00063
00064
00065
00066 #ifndef GIBBSSAMPLER_H_
00067 #define GIBBSSAMPLER_H_
00068
00069 #include "mcmc.h"
00070 #include "gibbsparams.h"
00071 #include "maxwalksat.h"
00072 #include "convergencetest.h"
00073 #include "gelmanconvergencetest.h"
00074
00075
00076 enum WalksatType { NONE = 0, MAXWALKSAT = 1 };
00077
00078 const bool gibbsdebug = false;
00079
00083 class GibbsSampler : public MCMC
00084 {
00085 public:
00086
00093 GibbsSampler(VariableState* state, long int seed,
00094 const bool& trackClauseTrueCnts, GibbsParams* gibbsParams)
00095 : MCMC(state, seed, trackClauseTrueCnts, gibbsParams)
00096 {
00097
00098 gamma_ = gibbsParams->gamma;
00099 epsilonError_ = gibbsParams->epsilonError;
00100 fracConverged_ = gibbsParams->fracConverged;
00101 walksatType_ = gibbsParams->walksatType;
00102 testConvergence_ = gibbsParams->testConvergence;
00103 samplesPerTest_ = gibbsParams->samplesPerTest;
00104
00105
00106 mws_ = new MaxWalkSat(state_, seed, false, gibbsParams->mwsParams);
00107 }
00108
00112 ~GibbsSampler()
00113 {
00114 deleteConvergenceTests(burnConvergenceTests_, gibbsConvergenceTests_,
00115 state_->getNumAtoms());
00116 delete mws_;
00117 }
00118
00122 void init()
00123 {
00124
00125 initTruthValuesAndWts(numChains_);
00126
00127 cout << "Initializing Gibbs sampling " ;
00128
00129 if (walksatType_ == 1)
00130 {
00131 cout << "with MaxWalksat" << endl;
00132 for (int c = 0; c < numChains_; c++)
00133 {
00134 cout << "for chain " << c << "..." << endl;
00135 mws_->init();
00136 mws_->infer();
00137 saveLowStateToChain(c);
00138 }
00139 if (numChains_ == 1) state_->saveLowStateToGndPreds();
00140 }
00141
00142 else
00143 {
00144 cout << "randomly" << endl;
00145 randomInitGndPredsTruthValues(numChains_);
00146 }
00147
00148
00149
00150 initNumTrueLits(numChains_);
00151
00152 int numGndPreds = state_->getNumAtoms();
00153
00154 initConvergenceTests(burnConvergenceTests_, gibbsConvergenceTests_,
00155 gamma_, epsilonError_, numGndPreds, numChains_);
00156 }
00157
00161 void infer()
00162 {
00163 initNumTrue();
00164 Timer timer;
00165
00166 bool burningIn = (burnMaxSteps_ > 0) ? true : false;
00167 double secondsElapsed = 0;
00168 double startTimeSec = timer.time();
00169 double currentTimeSec;
00170
00171
00172 if (trackClauseTrueCnts_)
00173 for (int clauseno = 0; clauseno < clauseTrueCnts_->size(); clauseno++)
00174 (*clauseTrueCnts_)[clauseno] = 0;
00175
00176
00177 GroundPredicateHashArray affectedGndPreds;
00178 Array<int> affectedGndPredIndices;
00179
00180 int numAtoms = state_->getNumAtoms();
00181 for (int i = 0; i < numAtoms; i++)
00182 {
00183 affectedGndPreds.append(state_->getGndPred(i), numAtoms);
00184 affectedGndPredIndices.append(i);
00185 }
00186 for (int c = 0; c < numChains_; c++)
00187 updateWtsForGndPreds(affectedGndPreds, affectedGndPredIndices, c);
00188 affectedGndPreds.clear();
00189 affectedGndPredIndices.clear();
00190
00191 cout << "Running Gibbs sampling..." << endl;
00192
00193 int sample = 0;
00194 int numSamplesPerPred = 0;
00195 bool done = false;
00196 while (!done)
00197 {
00198 ++sample;
00199
00200 if (sample % samplesPerTest_ == 0)
00201 {
00202 currentTimeSec = timer.time();
00203 secondsElapsed = currentTimeSec-startTimeSec;
00204 cout << "Sample (per pred per chain) " << sample << ", time elapsed = ";
00205 Timer::printTime(cout, secondsElapsed); cout << endl;
00206 }
00207
00208
00209 for (int c = 0; c < numChains_; c++)
00210 {
00211 performGibbsStep(c, burningIn, affectedGndPreds,
00212 affectedGndPredIndices);
00213 if (!burningIn) numSamplesPerPred++;
00214 }
00215
00216
00217 for (int i = 0; i < state_->getNumAtoms(); i++)
00218 {
00219 const bool* vals = truthValues_[i].getItems();
00220
00221 if (burningIn) burnConvergenceTests_[i]->appendNewValues(vals);
00222 else gibbsConvergenceTests_[i]->appendNewValues(vals);
00223 }
00224
00225 if (sample % samplesPerTest_ != 0) continue;
00226 if (burningIn)
00227 {
00228
00229
00230 bool burnConverged = false;
00231
00232 if (testConvergence_)
00233 burnConverged =
00234 GelmanConvergenceTest::checkConvergenceOfAll(burnConvergenceTests_,
00235 state_->getNumAtoms(),
00236 true);
00237 if ( (sample >= burnMinSteps_ && burnConverged)
00238 || (burnMaxSteps_ >= 0 && sample >= burnMaxSteps_)
00239 || (maxSeconds_ > 0 && secondsElapsed >= maxSeconds_))
00240 {
00241 cout << "Done burning. " << sample << " samples per pred per chain";
00242 if (testConvergence_)
00243 {
00244 cout << " (" << (burnConverged? "converged":"didn't converge")
00245 <<" at total of " << numChains_*sample << " samples per pred)";
00246 }
00247 cout << endl;
00248 burningIn = false;
00249 sample = 0;
00250 }
00251 }
00252 else
00253 {
00254 bool gibbsConverged = false;
00255
00256 if (testConvergence_)
00257 gibbsConverged =
00258 ConvergenceTest::checkConvergenceOfAtLeast(gibbsConvergenceTests_,
00259 state_->getNumAtoms(),
00260 sample, fracConverged_,
00261 true);
00262
00263 if ( (sample >= minSteps_ && gibbsConverged)
00264 || (maxSteps_ >= 0 && sample >= maxSteps_)
00265 || (maxSeconds_ > 0 && secondsElapsed >= maxSeconds_))
00266 {
00267 cout << "Done Gibbs sampling. " << sample
00268 << " samples per pred per chain";
00269 if (testConvergence_)
00270 {
00271 cout << " (" << (gibbsConverged? "converged":"didn't converge")
00272 <<" at total of " << numSamplesPerPred << " samples per pred)";
00273 }
00274 cout << endl;
00275 done = true;
00276 }
00277 }
00278 cout.flush();
00279 }
00280
00281 cout<< "Time taken for Gibbs sampling = ";
00282 Timer::printTime(cout, timer.time() - startTimeSec); cout << endl;
00283
00284
00285 for (int i = 0; i < state_->getNumAtoms(); i++)
00286 {
00287 setProbTrue(i, numTrue_[i] / numSamplesPerPred);
00288 }
00289
00290
00291 if (trackClauseTrueCnts_)
00292 {
00293
00294 for (int i = 0; i < clauseTrueCnts_->size(); i++)
00295 (*clauseTrueCnts_)[i] = (*clauseTrueCnts_)[i] / numSamplesPerPred;
00296 }
00297 }
00298
00299 private:
00300
00304 void initConvergenceTests(GelmanConvergenceTest**& burnConvergenceTests,
00305 ConvergenceTest**& gibbsConvergenceTests,
00306 const double& gamma, const double& epsilonFrac,
00307 const int& numGndPreds, const int& numChains)
00308 {
00309 burnConvergenceTests = new GelmanConvergenceTest*[numGndPreds];
00310 gibbsConvergenceTests = new ConvergenceTest*[numGndPreds];
00311 for (int i = 0; i < numGndPreds; i++)
00312 {
00313 burnConvergenceTests[i] = new GelmanConvergenceTest(numChains);
00314 gibbsConvergenceTests[i] = new ConvergenceTest(numChains, gamma,
00315 epsilonFrac);
00316 }
00317 }
00318
00322 void deleteConvergenceTests(GelmanConvergenceTest**& burnConvergenceTests,
00323 ConvergenceTest**& gibbsConvergenceTests,
00324 const int& numGndPreds)
00325 {
00326 for (int i = 0; i < numGndPreds; i++)
00327 {
00328 delete burnConvergenceTests[i];
00329 delete gibbsConvergenceTests[i];
00330 }
00331 delete [] burnConvergenceTests;
00332 delete [] gibbsConvergenceTests;
00333 }
00334
00335 private:
00336
00337 double gamma_;
00338
00339 double epsilonError_;
00340
00341 double fracConverged_;
00342
00343 int walksatType_;
00344
00345 int testConvergence_;
00346
00347 int samplesPerTest_;
00348
00349 GelmanConvergenceTest** burnConvergenceTests_;
00350
00351 ConvergenceTest** gibbsConvergenceTests_;
00352
00353
00354 MaxWalkSat* mws_;
00355 };
00356
00357 #endif