Substantial refactoring to implement correct Naive, UCT Monte Carlo tree search methods.
Removed unnecessary distinction between policy and tree search (tree search is a special kind of policy). Calculation of all valid moves / arbitrary sets of moves is now a separate class, as it serves a different purpose than a policy. Introduced a regression error in the AlphaBeta test.
This commit is contained in:
34
src/net/woodyfolsom/msproj/policy/MonteCarloUCT.java
Normal file
34
src/net/woodyfolsom/msproj/policy/MonteCarloUCT.java
Normal file
@@ -0,0 +1,34 @@
|
||||
package net.woodyfolsom.msproj.policy;
|
||||
|
||||
|
||||
/**
 * Subclass of {@link MonteCarlo} whose name indicates a UCT (Upper Confidence
 * bounds applied to Trees) variant of Monte Carlo tree search.
 *
 * <p>As written, every overridden method is still an IDE-generated stub that
 * returns a placeholder value ({@code null}, {@code 0}) or does nothing, so
 * this class does not yet perform any search of its own.
 *
 * <p>NOTE(review): the four overridden methods presumably correspond to the
 * selection, expansion, simulation and back-propagation phases of MCTS as
 * driven by the superclass -- confirm against {@code MonteCarlo}.
 */
public class MonteCarloUCT extends MonteCarlo {
|
||||
|
||||
/**
 * Creates the policy by forwarding both arguments unchanged to the
 * {@code MonteCarlo} constructor.
 *
 * @param movePolicy policy handed to the superclass (presumably used to
 *        choose moves during playouts -- confirm in {@code MonteCarlo})
 * @param searchTimeLimit search time limit handed to the superclass (unit
 *        is not visible here -- TODO confirm, likely milliseconds)
 */
public MonteCarloUCT(Policy movePolicy, long searchTimeLimit) {
|
||||
super(movePolicy, searchTimeLimit);
|
||||
}
|
||||
|
||||
/**
 * Not yet implemented: currently ignores {@code node} and always returns
 * {@code null}.
 *
 * @param node tree node to descend from (unused by this stub)
 * @return always {@code null} until the stub is implemented
 */
@Override
|
||||
public MonteCarloTreeNode descend(MonteCarloTreeNode node) {
|
||||
// TODO Auto-generated method stub
|
||||
return null;
|
||||
}
|
||||
|
||||
/**
 * Not yet implemented: currently ignores {@code node} and always returns
 * {@code null}.
 *
 * @param node tree node to grow (unused by this stub)
 * @return always {@code null} until the stub is implemented
 */
@Override
|
||||
public MonteCarloTreeNode grow(MonteCarloTreeNode node) {
|
||||
// TODO Auto-generated method stub
|
||||
return null;
|
||||
}
|
||||
|
||||
/**
 * Not yet implemented: currently ignores {@code node} and always returns
 * {@code 0}.
 *
 * @param node tree node to roll out from (unused by this stub)
 * @return always {@code 0} until the stub is implemented
 */
@Override
|
||||
public int rollout(MonteCarloTreeNode node) {
|
||||
// TODO Auto-generated method stub
|
||||
return 0;
|
||||
}
|
||||
|
||||
/**
 * Not yet implemented: currently a no-op that ignores both arguments.
 *
 * @param node tree node to update (unused by this stub)
 * @param reward reward value to apply (unused by this stub)
 */
@Override
|
||||
public void update(MonteCarloTreeNode node, int reward) {
|
||||
// TODO Auto-generated method stub
|
||||
|
||||
}
|
||||
|
||||
}
|
||||
Reference in New Issue
Block a user