void PositionMonteCarloTreeSearch::go(unsigned int depth) {
    (void)depth; // depth is not needed here
    srand(time(NULL));
    MCTSNode *rootNode = new MCTSNode();
    int iterations=0;
    while(1) {
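        // One MCTS iteration: selection, expansion, simulation (playout) and backpropagation.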
        PositionMonteCarloTreeSearch *rootPos = new PositionMonteCarloTreeSearch(*this);
        MCTSNode *selected = rootNode->select(rootPos);
        MCTSNode *expanded = selected->expand(rootPos);
        double result = expanded->simulate(rootPos);
        expanded->update(result);
        iterations++;
        // Release the per-iteration copy of the position.
        delete rootPos;
        // Check the clock only every 100 iterations to keep the overhead low.
        if (iterations%100==0) {
            if (timer.isTimeout() || timer.checkTimeout())
                break;
        }
    }
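    // Ask the root for the move it considers best after the search.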
    string foundMove=rootNode->getMove();
    delete rootNode;
    
    /***********************************
     * Print the result of the search. *
     ***********************************/
    timer.stopTimer();
    double seconds = timer.getStartEndDiffSeconds();
    cout << "Move: " << foundMove << endl;
    cout << "Time: " << seconds << " seconds" << endl;
    cout << "bestmove " << foundMove << endl;
}
Example #2
File: mcts.cpp Project: ikoryakovskiy/grl
void MCTSPolicy::act(double time, const Observation &in, Action *out)
{
  // Clear tree at start of episode
  if (time == 0.)
  {
    safe_delete(&root_);
    trunk_ = NULL;
  }

  // Try warm start
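  // Reuse the subtree below the previously selected child if its predicted
  // state is close enough to the new observation.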
  if (trunk_ && trunk_->children())
  {
    double maxdiff = 0;
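    // Pick the child the tree currently prefers (select with a zero exploration term).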
    MCTSNode *selected = trunk_->select(0);
    Vector predicted = selected->state();
    
    for (size_t ii=0; ii < in.size(); ++ii)
      maxdiff = fmax(maxdiff, fabs(in[ii]-predicted[ii]));
      
    if (maxdiff < 0.05)
    {
      trunk_ = selected;
      selected->orphanize();

      CRAWL("Trunk set to selected state " << trunk_->state());
    }
    else
    {
      safe_delete(&root_);
      trunk_ = NULL;
      TRACE("Cannot use warm start: predicted state " << predicted << " differs from actual state " << in);
    }
  }

  // Allocate new tree if warm start was not possible
  if (!trunk_)
  {
    allocate();
    root_->init(NULL, 0, in, 0, false);
    root_->allocate(discretizer_->size(in));
    trunk_ = root_;
  }
  
  CRAWL("Trunk set to state " << trunk_->state());

  // Search until budget is up
  timer t;
  size_t searches=0;

  while (t.elapsed() < budget_)
  {
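    // Selection/expansion: treePolicy() descends the tree and returns the node to evaluate;
    // its depth is found by walking the parent chain back to the root.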
    MCTSNode *node = treePolicy(), *it=node;
    size_t depth=0;
    
    while ((it = it->parent()))
      depth++;
    
    double reward = 0;
    
    CRAWL("Tree policy selected node with state " << node->state() << " at depth " << depth);
    
    if (!node->terminal() && depth < horizon_)
      reward = defaultPolicy(node->state(), horizon_-depth);
     
    CRAWL("Default policy got reward " << reward);

    do
    {
      node->update(reward);
      reward = gamma_*reward + node->reward();
    } while ((node = node->parent()));
    
    searches++;
  }
  
  // Select best action
  if (trunk_->children())
  {
    MCTSNode *node = trunk_->select(0);
    *out = discretizer_->at(trunk_->state(), node->action());
    out->type = atGreedy;

    TRACE("Selected action " << *out << " (Q " << node->q()/node->visits() << ") after " << searches << " searches");
  }
  else
  {
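    // The trunk has no children yet: fall back to a uniformly random discrete action.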
    *out = discretizer_->at(in, lrand48()%discretizer_->size(in));
    out->type = atExploratory;

    TRACE("Selected random action " << *out);
  }
}