in simple_game/cfr_opt.h [104:130]
// Refreshes strategy_ from sumRegret_ and resets the reach probability
// accumulated so far.
//
// Steps, in order:
//   1. Chance players only have reachPr_ cleared; nothing else is touched.
//   2. addMulti(sumStrategy_, strategy_, reachPr_) is called with the
//      current strategy (presumably accumulating strategy_ * reachPr_ into
//      sumStrategy_ -- confirm against addMulti).
//   3. strategy_ is overwritten with sumRegret_, passed through relu(), and
//      normalized.
//   4. If normalize() reports failure (falsy return), the strategy falls
//      back to uniform(); when exploreFactor_ > 0 each entry is additionally
//      perturbed with a sample from gen_(rng_), then relu() and normalize()
//      are applied again.
void computeStrategy() {
  // Chance Player won't optimize its strategy.
  if (isChancePlayer_) {
    reachPr_ = 0;
    return;
  }

  // Fold the current strategy into the running sum before replacing it.
  addMulti(sumStrategy_, strategy_, reachPr_);
  reachPr_ = 0;

  // Candidate strategy derived from the summed regrets.
  strategy_ = sumRegret_;
  relu(strategy_);

  if (!normalize(strategy_)) {
    // Normalization did not succeed: fall back to a uniform strategy.
    uniform(strategy_);

    // Exploration: perturb the uniform strategy and re-normalize it.
    if (exploreFactor_ > 0) {
      for (int action = 0; action < numAction_; ++action) {
        strategy_[action] += gen_(rng_);
      }
      relu(strategy_);
      normalize(strategy_);
    }
  }
}