Commit 90e81581 authored by Timothy LAIRD's avatar Timothy LAIRD

Debug Commit 2

parent ab11fe24
...@@ -14,31 +14,55 @@ import java.util.Random; ...@@ -14,31 +14,55 @@ import java.util.Random;
* @author timot * @author timot
*/ */
public class AlgoRechercheMCTS extends AlgoRecherche { public class AlgoRechercheMCTS extends AlgoRecherche {
ArbreMCTS search; private final ArbreMCTS search;
int maxIterations; private final int maxIterations;
private final Random seed;
private ArrayList<Integer> chemin;
private final double coeff;
public AlgoRechercheMCTS(Joueur player, Joueur opponent, int m){ public AlgoRechercheMCTS(Joueur player, Joueur opponent, int m, double c){
search = new ArbreMCTS(player, opponent); search = new ArbreMCTS(player, opponent);
maxIterations = m; maxIterations = m;
seed = new Random();
coeff = c;
} }
@Override @Override
public Coup meilleurCoup(Plateau _plateau, Joueur _joueur, boolean _ponder) { public Coup meilleurCoup(Plateau _plateau, Joueur _joueur, boolean _ponder) {
Coup lastPlayed = _plateau.getDernierCoup();
if(search.root().coup() == null){
search.root().coup(lastPlayed);
expansion(search.root(), _plateau);
}
Node tmp = null;
Iterator<Node> children = search.root().children().iterator();
if(lastPlayed != null){
while(children.hasNext()){
tmp = children.next();
if(tmp.coup().equals(lastPlayed)){
search.root(tmp);
}
}
}
Node root = search.root(); Node root = search.root();
_plateau.sauvegardePosition(0); _plateau.sauvegardePosition(0);
int iterations = 0; int iterations = 0;
Random seed = new Random(); int trivial = 0;
while(iterations < maxIterations){ while(iterations < maxIterations){
iterations++; iterations++;
Node nextNode = selection(root); chemin = new ArrayList<>();
Node nextNode = selection(root, _plateau);
if(!_plateau.partieTerminee()){ if(!_plateau.partieTerminee()){
expansion(nextNode, _plateau); expansion(nextNode, _plateau);
trivial++;
} }
if(!nextNode.children().isEmpty()){ if(!nextNode.children().isEmpty()){
nextNode = nextNode.children().get(seed.nextInt(nextNode.children().size())); nextNode = nextNode.children().get(seed.nextInt(nextNode.children().size()));
_plateau.joueCoup(nextNode.coup());
} }
Joueur winner = simulate(nextNode, _plateau); Joueur winner = simulate(nextNode, _plateau);
update(winner, nextNode); backPropagation(root, winner);
_plateau.restaurePosition(0); _plateau.restaurePosition(0);
} }
Node nextPlay = root.nextPlay(); Node nextPlay = root.nextPlay();
...@@ -46,12 +70,32 @@ public class AlgoRechercheMCTS extends AlgoRecherche { ...@@ -46,12 +70,32 @@ public class AlgoRechercheMCTS extends AlgoRecherche {
return nextPlay.coup(); return nextPlay.coup();
} }
private Node selection(Node root){ public Node selection(Node n, Plateau pl){
Node currentNode = root; if (n.children().isEmpty()){
while(!(currentNode.children().isEmpty())){ return n;
currentNode = Fraction.bestChild(currentNode);
} }
return currentNode; else {
double valMax=Double.NEGATIVE_INFINITY;
int indiceSelection=0;
ArrayList<Node> f = n.children();
double val;
for(int i = 0; i < f.size(); i++){
Node nf = f.get(i);
if(nf.visits() == 0){
val = Double.MAX_VALUE;
}else{
val = (nf.wins()/nf.visits())+coeff*Math.sqrt(Math.log(n.visits())/nf.visits());
}
if (val>valMax){
indiceSelection=i;
valMax=val;
}
}
Node noeudSelectionne=f.get(indiceSelection);
pl.joueCoup(noeudSelectionne.coup());
chemin.add(indiceSelection);
return selection(noeudSelectionne, pl);
}
} }
private void expansion(Node leaf, Plateau leafPlateau){ private void expansion(Node leaf, Plateau leafPlateau){
...@@ -68,7 +112,6 @@ public class AlgoRechercheMCTS extends AlgoRecherche { ...@@ -68,7 +112,6 @@ public class AlgoRechercheMCTS extends AlgoRecherche {
private Joueur simulate(Node node, Plateau board){ private Joueur simulate(Node node, Plateau board){
Joueur p1 = node.player();Joueur p2 = node.opponent(); Joueur p1 = node.player();Joueur p2 = node.opponent();
Joueur currentPlayer = node.player(); Joueur currentPlayer = node.player();
Random seed = new Random();
Coup coup; Coup coup;
ArrayList<Coup> coups; ArrayList<Coup> coups;
while(!board.partieTerminee()){ while(!board.partieTerminee()){
...@@ -84,14 +127,19 @@ public class AlgoRechercheMCTS extends AlgoRecherche { ...@@ -84,14 +127,19 @@ public class AlgoRechercheMCTS extends AlgoRecherche {
return board.vainqueur(); return board.vainqueur();
} }
private void update(Joueur winner, Node node){ public void backPropagation(Node n, Joueur gagnant){
Node currentNode = node; Node currentNode = n; int index = 0;
while(currentNode != null){ do{
currentNode.addVisit(); currentNode.addVisit();
if(currentNode.player().equals(winner)){ if (currentNode.player().equals(gagnant)){
currentNode.addWin(); currentNode.addWin();
} }
currentNode = currentNode.parent(); currentNode = currentNode.children().get(chemin.get(index));
index++;
}while(index < chemin.size());
currentNode.addVisit();
if (currentNode.player().equals(gagnant)){
currentNode.addWin();
} }
} }
......
...@@ -10,7 +10,7 @@ package tictactoecodingame; ...@@ -10,7 +10,7 @@ package tictactoecodingame;
* @author timot * @author timot
*/ */
public class ArbreMCTS { public class ArbreMCTS {
Node root; private Node root;
public ArbreMCTS(Joueur pl, Joueur o){ public ArbreMCTS(Joueur pl, Joueur o){
root = new Node(null, pl, o); root = new Node(null, pl, o);
......
...@@ -12,12 +12,12 @@ import java.util.Iterator; ...@@ -12,12 +12,12 @@ import java.util.Iterator;
* @author timot * @author timot
*/ */
public class Node { public class Node {
Coup coup; private Coup coup;
Joueur player; private final Joueur player;
Joueur opponent; private final Joueur opponent;
int visits = 0; private int visits = 0;
int wins = 0; private int wins = 0;
ArrayList<Node> children; private final ArrayList<Node> children;
public Node(Coup c, Joueur pl, Joueur o){ public Node(Coup c, Joueur pl, Joueur o){
coup = c; coup = c;
...@@ -46,9 +46,13 @@ public class Node { ...@@ -46,9 +46,13 @@ public class Node {
return children; return children;
} }
public Coup coup(){ public Coup coup(){
return coup; return coup;
} }
public void coup(Coup c){
coup = c;
}
public void addVisit(){ public void addVisit(){
visits++; visits++;
...@@ -57,20 +61,24 @@ public class Node { ...@@ -57,20 +61,24 @@ public class Node {
public void addWin(){ public void addWin(){
wins++; wins++;
} }
public double winrate(){
if(visits == 0){
return 0;
}else{
return wins/visits;
}
}
public Node nextPlay(){ public Node nextPlay(){
Node bestNode = null; Node bestNode = null;
double winrate = 0; double winrate = Double.NEGATIVE_INFINITY;
Iterator<Node> child = children.iterator(); Iterator<Node> child = children.iterator();
Node currentNode; double currentWinrate; Node currentNode; double currentWinrate;
while(child.hasNext()){ while(child.hasNext()){
currentNode = child.next(); currentNode = child.next();
if(currentNode.visits == 0 ){ currentWinrate = currentNode.winrate();
currentWinrate = 0; if(currentWinrate > winrate){
}else{
currentWinrate = currentNode.wins() / currentNode.visits();
}
if( currentWinrate > winrate){
winrate = currentWinrate; winrate = currentWinrate;
bestNode = currentNode; bestNode = currentNode;
} }
......
...@@ -18,7 +18,7 @@ public class Player { ...@@ -18,7 +18,7 @@ public class Player {
// Remplacer ici l'algorithme aléatoire par votre algorithme. // Remplacer ici l'algorithme aléatoire par votre algorithme.
// Créer une nouvelle classe qui hérite de la class AlgoRecherche // Créer une nouvelle classe qui hérite de la class AlgoRecherche
AlgoRechercheMCTS alea = new AlgoRechercheMCTS(joueurOrdi, humain, 100); // L'ordinateur joue au hasard AlgoRechercheMCTS alea = new AlgoRechercheMCTS(joueurOrdi, humain, 1000,0.1);
joueurOrdi.setAlgoRecherche(alea); joueurOrdi.setAlgoRecherche(alea);
GrilleTicTacToe3x3 grille = new GrilleTicTacToe3x3(); GrilleTicTacToe3x3 grille = new GrilleTicTacToe3x3();
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment