MCTS v1, v2, v3 and v4 done; v5 is a work in progress

2026-02-04 19:04:49 +00:00 · 2026-01-15 01:37:33 +01:00
parent d078a70950
commit 4e22c01bde
12 changed files with 1318 additions and 260 deletions
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI.java
@@ -1,193 +0,0 @@
-package org.toop.game.players.ai;
-
-import org.toop.framework.gameFramework.GameState;
-import org.toop.framework.gameFramework.model.game.PlayResult;
-import org.toop.framework.gameFramework.model.game.TurnBasedGame;
-import org.toop.framework.gameFramework.model.player.AbstractAI;
-
-import java.util.Random;
-
-public class MCTSAI extends AbstractAI {
-	private static class Node {
-		public TurnBasedGame state;
-		public long move;
-
-		public Node parent;
-
-		public int expanded;
-		public Node[] children;
-
-		public int visits;
-		public float value;
-
-		public Node(TurnBasedGame state, long move, Node parent) {
-			this.state = state;
-			this.move = move;
-
-			this.parent = parent;
-
-			this.expanded = 0;
-			this.children = new Node[Long.bitCount(state.getLegalMoves())];
-
-			this.visits = 0;
-			this.value = 0.0f;
-		}
-
-		public Node(TurnBasedGame state) {
-			this(state, 0L, null);
-		}
-
-		public boolean isFullyExpanded() {
-			return expanded >= children.length;
-		}
-
-		float calculateUCT() {
-			float exploitation = visits <= 0? 0 : value / visits;
-			float exploration = 1.41f * (float)(Math.sqrt(Math.log(visits) / visits));
-
-			return exploitation + exploration;
-		}
-
-		public Node bestUCTChild() {
-			int bestChildIndex = -1;
-			float bestScore = Float.NEGATIVE_INFINITY;
-
-			for (int i = 0; i < expanded; i++) {
-				final float score = calculateUCT();
-
-				if (score > bestScore) {
-					bestChildIndex = i;
-					bestScore = score;
-				}
-			}
-
-			return bestChildIndex >= 0? children[bestChildIndex] : this;
-		}
-	}
-
-	private final int milliseconds;
-
-	public MCTSAI(int milliseconds) {
-		this.milliseconds = milliseconds;
-	}
-
-	public MCTSAI(MCTSAI other) {
-		this.milliseconds = other.milliseconds;
-	}
-
-	@Override
-	public MCTSAI deepCopy() {
-		return new MCTSAI(this);
-	}
-
-	@Override
-	public long getMove(TurnBasedGame game) {
-		Node root = new Node(game.deepCopy());
-
-		long endTime = System.currentTimeMillis() + milliseconds;
-
-		while (System.currentTimeMillis() <= endTime) {
-			Node node = selection(root);
-			long legalMoves = node.state.getLegalMoves();
-
-			if (legalMoves != 0) {
-				node = expansion(node, legalMoves);
-			}
-
-			float result = 0.0f;
-
-			if (node.state.getLegalMoves() != 0) {
-				result = simulation(node.state, game.getCurrentTurn());
-			}
-
-			backPropagation(node, result);
-		}
-
-		int mostVisitedIndex = -1;
-		int mostVisits = -1;
-
-		for (int i = 0; i < root.expanded; i++) {
-			if (root.children[i].visits > mostVisits) {
-				mostVisitedIndex = i;
-				mostVisits = root.children[i].visits;
-			}
-		}
-
-		return mostVisitedIndex != -1? root.children[mostVisitedIndex].move : randomSetBit(game.getLegalMoves());
-	}
-
-	private Node selection(Node node) {
-		while (node.state.getLegalMoves() != 0L && node.isFullyExpanded()) {
-			node = node.bestUCTChild();
-		}
-
-		return node;
-	}
-
-	private Node expansion(Node node, long legalMoves) {
-		for (int i = 0; i < node.expanded; i++) {
-			legalMoves &= ~node.children[i].move;
-		}
-
-		if (legalMoves == 0L) {
-			return node;
-		}
-
-		long move = randomSetBit(legalMoves);
-
-		TurnBasedGame copy = node.state.deepCopy();
-		copy.play(move);
-
-		Node newlyExpanded = new Node(copy, move, node);
-
-		node.children[node.expanded] = newlyExpanded;
-		node.expanded++;
-
-		return newlyExpanded;
-	}
-
-	private float simulation(TurnBasedGame state, int playerIndex) {
-		TurnBasedGame copy = state.deepCopy();
-		long legalMoves = copy.getLegalMoves();
-		PlayResult result = null;
-
-		while (legalMoves != 0) {
-			result = copy.play(randomSetBit(legalMoves));
-			legalMoves = copy.getLegalMoves();
-		}
-
-		if (result.state() == GameState.WIN) {
-			if (result.player() == playerIndex) {
-				return 1.0f;
-			}
-
-			return -1.0f;
-		}
-
-		return -0.2f;
-	}
-
-	private void backPropagation(Node node, float value) {
-		while (node != null) {
-			node.visits++;
-			node.value += value;
-			node = node.parent;
-		}
-	}
-
-	public static long randomSetBit(long value) {
-		Random random = new Random();
-
-		int count = Long.bitCount(value);
-		int target = random.nextInt(count);
-
-		while (true) {
-			int bit = Long.numberOfTrailingZeros(value);
-			if (target == 0) {
-				return 1L << bit;
-			}
-			value &= value - 1;
-			target--;
-		}
-	}
-}
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI1.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI1.java
@@ -0,0 +1,250 @@
+package org.toop.game.players.ai;
+
+import org.toop.framework.gameFramework.model.game.TurnBasedGame;
+import org.toop.framework.gameFramework.model.player.AbstractAI;
+
+import java.util.Random;
+
+public class MCTSAI1<T extends TurnBasedGame<T>> extends AbstractAI<T> {
+	private static class Node {
+		public TurnBasedGame<?> state;
+
+		public long move;
+		public long unexpandedMoves;
+
+		public Node parent;
+
+		public Node[] children;
+		public int expanded;
+
+		public float value;
+		public int visits;
+
+		public boolean solved;
+		public float solvedValue;
+
+		public Node(TurnBasedGame<?> state, Node parent, long move) {
+			final long legalMoves = state.getLegalMoves();
+
+			this.state = state;
+
+			this.move = move;
+			this.unexpandedMoves = legalMoves;
+
+			this.parent = parent;
+
+			this.children = new Node[Long.bitCount(legalMoves)];
+			this.expanded = 0;
+
+			this.value = 0.0f;
+			this.visits = 0;
+
+			this.solved = false;
+			this.solvedValue = 0.0f;
+		}
+
+		public Node(TurnBasedGame<?> state) {
+			this(state, null, 0L);
+		}
+
+		public boolean isFullyExpanded() {
+			return expanded == children.length;
+		}
+
+		public float calculateUCT(int parentVisits) {
+			if (visits == 0) {
+				return Float.POSITIVE_INFINITY;
+			}
+
+			final float exploitation = value / visits;
+			final float exploration = 1.41f * (float)(Math.sqrt(Math.log(parentVisits) / visits));
+
+			return exploitation + exploration;
+		}
+
+		public Node bestUCTChild() {
+			Node highestUCTChild = null;
+			float highestUCT = Float.NEGATIVE_INFINITY;
+
+			for (int i = 0; i < expanded; i++) {
+				final float childUCT = children[i].calculateUCT(visits);
+
+				if (childUCT > highestUCT) {
+					highestUCTChild = children[i];
+					highestUCT = childUCT;
+				}
+			}
+
+			return highestUCTChild;
+		}
+	}
+
+	private static final Random random = new Random();
+
+	private final int milliseconds;
+
+	public MCTSAI1(int milliseconds) {
+		this.milliseconds = milliseconds;
+	}
+
+	public MCTSAI1(MCTSAI1<T> other) {
+		this.milliseconds = other.milliseconds;
+	}
+
+	@Override
+	public MCTSAI1<T> deepCopy() {
+		return new MCTSAI1<>(this);
+	}
+
+	@Override
+	public long getMove(T game) { // searches for 'milliseconds' and returns the move bit of the most visited root child
+		final Node root = new Node(game, null, 0L); // 'game' is not copied here: expansion() and simulation() play on deep copies
+
+		final long endTime = System.nanoTime() + milliseconds * 1_000_000L; // deadline in nanoseconds
+
+		while (System.nanoTime() < endTime) {
+			Node leaf = selection(root);
+			leaf = expansion(leaf);
+			final float value = simulation(leaf);
+			backPropagation(leaf, value);
+		}
+
+		final Node mostVisitedChild = mostVisitedChild(root); // null when nothing was expanded (no iteration ran / no legal moves)
+		return mostVisitedChild != null? mostVisitedChild.move : randomSetBit(game.getLegalMoves()); // fallback yields 0 if no moves
+	}
+
+	private Node mostVisitedChild(Node root) {
+		Node mostVisitedChild = null;
+		int mostVisited = -1;
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].visits > mostVisited) {
+				mostVisitedChild = root.children[i];
+				mostVisited = root.children[i].visits;
+			}
+		}
+
+		return mostVisitedChild;
+	}
+
+	private Node selection(Node root) {
+		while (!root.solved && root.isFullyExpanded() && !root.state.isTerminal()) {
+			root = root.bestUCTChild();
+		}
+
+		return root;
+	}
+
+	private Node expansion(Node leaf) {
+		if (leaf.unexpandedMoves == 0L) {
+			return leaf;
+		}
+
+		final long unexpandedMove = leaf.unexpandedMoves & -leaf.unexpandedMoves;
+
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		copiedState.play(unexpandedMove);
+
+		final Node expandedChild = new Node(copiedState, leaf, unexpandedMove);
+
+		leaf.children[leaf.expanded] = expandedChild;
+		leaf.expanded++;
+
+		leaf.unexpandedMoves &= ~unexpandedMove;
+
+		return expandedChild;
+	}
+
+	private float simulation(Node leaf) {
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		final int playerIndex = 1 - copiedState.getCurrentTurn();
+
+		while (!copiedState.isTerminal()) {
+			final long legalMoves = copiedState.getLegalMoves();
+			final long randomMove = randomSetBit(legalMoves);
+
+			copiedState.play(randomMove);
+		}
+
+		if (copiedState.getWinner() == playerIndex) {
+			return 1.0f;
+		}
+
+		if (copiedState.getWinner() >= 0) {
+			return -1.0f;
+		}
+
+		return 0.0f;
+	}
+
+	private void backPropagation(Node leaf, float value) {
+		while (leaf != null) {
+			leaf.value += value;
+			leaf.visits++;
+
+			if (!leaf.solved) {
+				updateSolvedStatus(leaf);
+			}
+
+			value = -value;
+			leaf = leaf.parent;
+		}
+	}
+
+	private void updateSolvedStatus(Node node) { // flags 'node' as solved once its outcome is decided; invoked during backPropagation
+		if (node.state.isTerminal()) { // a finished game is solved immediately
+			node.solved = true;
+
+			final int winner = node.state.getWinner(); // -1 is handled as "no winner" below
+			final int mover = 1 - node.state.getCurrentTurn(); // assumes exactly two players indexed 0 and 1
+
+			node.solvedValue = winner == mover? 1.0f : winner == -1? 0.0f : -1.0f; // +1 mover won, 0 no winner, -1 other player won
+
+			return;
+		}
+
+		if (node.isFullyExpanded()) { // all child slots are filled, so the loop below never sees null
+			boolean allChildrenSolved = true;
+			boolean foundWinningMove = false;
+			boolean foundDrawMove = false;
+
+			for (final Node child : node.children) { // NOTE(review): child.solvedValue is relative to the child's mover — confirm the sign:
+				if (child.solved) { // if the turn advances on every play, that mover is the player choosing at this node,
+					if (child.solvedValue == -1.0f) { // so a -1 child would be a losing option for them, not a proof for this node
+						foundWinningMove = true;
+						break; // one such child is enough to decide the node as written
+					}
+
+					if (child.solvedValue == 0.0f) {
+						foundDrawMove = true;
+					}
+				} else {
+					allChildrenSolved = false; // an unsolved child blocks the "all solved" conclusion
+				}
+			}
+
+			if (foundWinningMove) {
+				node.solved = true;
+				node.solvedValue = 1.0f;
+			} else if (allChildrenSolved) { // every child solved and none at -1
+				node.solved = true;
+				node.solvedValue = foundDrawMove? 0.0f : -1.0f; // 0 if any child is 0, otherwise -1
+			}
+		}
+	}
+
+	private long randomSetBit(long value) {
+		if (0L == value) {
+			return 0;
+		}
+
+		final int bitCount = Long.bitCount(value);
+		final int randomBitCount = random.nextInt(bitCount);
+
+		for (int i = 0; i < randomBitCount; i++) {
+			value &= value - 1;
+		}
+
+		return value & -value;
+	}
+}
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI2.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI2.java
@@ -35,6 +35,9 @@ public class MCTSAI2 extends AbstractAI {

 			this.value = 0.0f;
 			this.visits = 0;
+
+			this.solved = false;
+			this.solvedValue = 0.0f;
 		}

 		public Node(TurnBasedGame state) {
@@ -46,6 +49,10 @@ public class MCTSAI2 extends AbstractAI {
 		}

 		public float calculateUCT(int parentVisits) {
+			if (visits == 0) {
+				return Float.POSITIVE_INFINITY;
+			}
+
 			final float exploitation = value / visits;
 			final float exploration = 1.41f * (float)(Math.sqrt(Math.log(parentVisits) / visits));

@@ -63,24 +70,29 @@ public class MCTSAI2 extends AbstractAI {
 					highestUCTChild = children[i];
 					highestUCT = childUCT;
 				}
-
 			}

 			return highestUCTChild;
 		}
 	}

-	private final Random random;
+	private static final Random random = new Random();
+
 	private final int milliseconds;

+	private Node root;
+
 	public MCTSAI2(int milliseconds) {
-		this.random = new Random();
 		this.milliseconds = milliseconds;
+
+		this.root = null;
 	}

 	public MCTSAI2(MCTSAI2 other) {
 		this.random = other.random;
 		this.milliseconds = other.milliseconds;
+
+		this.root = other.root;
 	}

 	@Override
@@ -90,7 +102,7 @@ public class MCTSAI2 extends AbstractAI {

 	@Override
 	public long getMove(TurnBasedGame game) {
-		final Node root = new Node(game, null, 0L);
+        root = findOrResetRoot(root, game);

 		final long endTime = System.nanoTime() + milliseconds * 1_000_000L;

@@ -102,8 +114,11 @@ public class MCTSAI2 extends AbstractAI {
 		}

 		final Node mostVisitedChild = mostVisitedChild(root);
+		final long move = mostVisitedChild.move;

-		return mostVisitedChild != null? mostVisitedChild.move : 0L;
+		root = findChildByMove(root, move);
+
+		return move;
 	}

 	private Node mostVisitedChild(Node root) {
@@ -120,8 +135,51 @@ public class MCTSAI2 extends AbstractAI {
 		return mostVisitedChild;
 	}

+	private Node findOrResetRoot(Node root, T game) {
+		if (root == null) {
+			return new Node(game.deepCopy());
+		}
+
+		if (areStatesEqual(root.state.getBoard(), game.getBoard())) {
+			return root;
+		}
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (areStatesEqual(root.children[i].state.getBoard(), game.getBoard())) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return new Node(game.deepCopy());
+	}
+
+	private Node findChildByMove(Node root, long move) {
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].move == move) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return null;
+	}
+
+	private boolean areStatesEqual(long[] state1, long[] state2) {
+		if (state1.length != state2.length) {
+			return false;
+		}
+
+		for (int i = 0; i < state1.length; i++) {
+			if (state1[i] != state2[i]) {
+				return false;
+			}
+		}
+
+		return true;
+	}
 	private Node selection(Node root) {
-		while (root.isFullyExpanded() && !root.state.isTerminal()) {
+		while (!root.solved && root.isFullyExpanded() && !root.state.isTerminal()) {
 			root = root.bestUCTChild();
 		}

@@ -161,7 +219,9 @@ public class MCTSAI2 extends AbstractAI {

 		if (copiedState.getWinner() == playerIndex) {
 			return 1.0f;
-		} else if (copiedState.getWinner() >= 0) {
+		}
+
+		if (copiedState.getWinner() >= 0) {
 			return -1.0f;
 		}

@@ -173,11 +233,57 @@ public class MCTSAI2 extends AbstractAI {
 			leaf.value += value;
 			leaf.visits++;

+			if (!leaf.solved) {
+				updateSolvedStatus(leaf);
+			}
+
 			value = -value;
 			leaf = leaf.parent;
 		}
 	}

+	private void updateSolvedStatus(Node node) {
+		if (node.state.isTerminal()) {
+			node.solved = true;
+
+			final int winner = node.state.getWinner();
+			final int mover = 1 - node.state.getCurrentTurn();
+
+			node.solvedValue = winner == mover? 1.0f : winner == -1? 0.0f : -1.0f;
+
+			return;
+		}
+
+		if (node.isFullyExpanded()) {
+			boolean allChildrenSolved = true;
+			boolean foundWinningMove = false;
+			boolean foundDrawMove = false;
+
+			for (final Node child : node.children) {
+				if (child.solved) {
+					if (child.solvedValue == -1.0f) {
+						foundWinningMove = true;
+						break;
+					}
+
+					if (child.solvedValue == 0.0f) {
+						foundDrawMove = true;
+					}
+				} else {
+					allChildrenSolved = false;
+				}
+			}
+
+			if (foundWinningMove) {
+				node.solved = true;
+				node.solvedValue = 1.0f;
+			} else if (allChildrenSolved) {
+				node.solved = true;
+				node.solvedValue = foundDrawMove? 0.0f : -1.0f;
+			}
+		}
+	}
+
 	private long randomSetBit(long value) {
 		if (0L == value) {
 			return 0;
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI3.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI3.java
@@ -3,7 +3,13 @@ package org.toop.game.players.ai;
 import org.toop.framework.gameFramework.model.game.TurnBasedGame;
 import org.toop.framework.gameFramework.model.player.AbstractAI;

+import java.util.ArrayList;
+import java.util.List;
 import java.util.Random;
+import java.util.concurrent.Callable;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.Future;

 public class MCTSAI3 extends AbstractAI {
 	private static class Node {
@@ -20,6 +26,9 @@ public class MCTSAI3 extends AbstractAI {
 		public float value;
 		public int visits;

+        public boolean solved;
+        public float solvedValue;
+
 		public Node(TurnBasedGame state, Node parent, long move) {
 			final long legalMoves = state.getLegalMoves();

@@ -35,6 +44,9 @@ public class MCTSAI3 extends AbstractAI {

 			this.value = 0.0f;
 			this.visits = 0;
+
+			this.solved = false;
+			this.solvedValue = 0.0f;
 		}

 		public Node(TurnBasedGame state) {
@@ -46,6 +58,10 @@ public class MCTSAI3 extends AbstractAI {
 		}

 		public float calculateUCT(int parentVisits) {
+			if (visits == 0) {
+				return Float.POSITIVE_INFINITY;
+			}
+
 			final float exploitation = value / visits;
 			final float exploration = 1.41f * (float)(Math.sqrt(Math.log(parentVisits) / visits));

@@ -63,23 +79,20 @@ public class MCTSAI3 extends AbstractAI {
 					highestUCTChild = children[i];
 					highestUCT = childUCT;
 				}
-
 			}

 			return highestUCTChild;
 		}
 	}

-	private final Random random;
+	private static final ThreadLocal<Random> random = ThreadLocal.withInitial(Random::new);

-	private Node root;
 	private final int milliseconds;
+	private final int threads;

-	public MCTSAI3(int milliseconds) {
-		this.random = new Random();
-
-		this.root = null;
+	public MCTSAI3(int milliseconds, int threads) {
 		this.milliseconds = milliseconds;
+		this.threads = threads;
 	}

 	public MCTSAI3(MCTSAI3 other) {
@@ -87,6 +100,7 @@ public class MCTSAI3 extends AbstractAI {

 		this.root = other.root;
 		this.milliseconds = other.milliseconds;
+		this.threads = other.threads;
 	}

 	@Override
@@ -95,24 +109,58 @@ public class MCTSAI3 extends AbstractAI {
 	}

 	@Override
-	public long getMove(TurnBasedGame game) {
-		detectRoot(game);
-
+	public long getMove(T game) {
+		final ExecutorService pool = Executors.newFixedThreadPool(threads);
 		final long endTime = System.nanoTime() + milliseconds * 1_000_000L;

-		while (System.nanoTime() < endTime) {
-			Node leaf = selection(root);
-			leaf = expansion(leaf);
-			final float value = simulation(leaf);
-			backPropagation(leaf, value);
+		final List<Callable<Node>> tasks = new ArrayList<>();
+
+		for (int i = 0; i < threads; i++) {
+			tasks.add(() -> {
+				final Node localRoot = new Node(game.deepCopy());
+
+				while (System.nanoTime() < endTime) {
+					Node leaf = selection(localRoot);
+					leaf = expansion(leaf);
+					final float value = simulation(leaf);
+					backPropagation(leaf, value);
+				}
+
+				return localRoot;
+			});
 		}

-		final Node mostVisitedChild = mostVisitedChild(root);
-		final long move = mostVisitedChild != null? mostVisitedChild.move : 0L;
+		try {
+			final List<Future<Node>> results = pool.invokeAll(tasks);

-		newRoot(move);
+			pool.shutdown();

-		return move;
+			final Node root = new Node(game.deepCopy());
+
+			for (int i = 0; i < root.children.length; i++) {
+				expansion(root);
+			}
+
+			for (final Future<Node> result : results) {
+				final Node localRoot = result.get();
+
+				for (final Node localChild : localRoot.children) {
+					for (int i = 0; i < root.children.length; i++) {
+						if (localChild.move == root.children[i].move) {
+							root.children[i].visits += localChild.visits;
+							root.visits += localChild.visits;
+							break;
+						}
+					}
+				}
+			}
+
+			final Node mostVisitedChild = mostVisitedChild(root);
+			return mostVisitedChild.move;
+		} catch (Exception _) {
+			final long legalMoves = game.getLegalMoves();
+			return randomSetBit(legalMoves);
+		}
 	}

 	private Node mostVisitedChild(Node root) {
@@ -184,7 +232,7 @@ public class MCTSAI3 extends AbstractAI {
 	}

 	private Node selection(Node root) {
-		while (root.isFullyExpanded() && !root.state.isTerminal()) {
+		while (!root.solved && root.isFullyExpanded() && !root.state.isTerminal()) {
 			root = root.bestUCTChild();
 		}

@@ -224,7 +272,9 @@ public class MCTSAI3 extends AbstractAI {

 		if (copiedState.getWinner() == playerIndex) {
 			return 1.0f;
-		} else if (copiedState.getWinner() >= 0) {
+		}
+
+		if (copiedState.getWinner() >= 0) {
 			return -1.0f;
 		}

@@ -236,18 +286,64 @@ public class MCTSAI3 extends AbstractAI {
 			leaf.value += value;
 			leaf.visits++;

+			if (!leaf.solved) {
+				updateSolvedStatus(leaf);
+			}
+
 			value = -value;
 			leaf = leaf.parent;
 		}
 	}

+	private void updateSolvedStatus(Node node) {
+		if (node.state.isTerminal()) {
+			node.solved = true;
+
+			final int winner = node.state.getWinner();
+			final int mover = 1 - node.state.getCurrentTurn();
+
+			node.solvedValue = winner == mover? 1.0f : winner == -1? 0.0f : -1.0f;
+
+			return;
+		}
+
+		if (node.isFullyExpanded()) {
+			boolean allChildrenSolved = true;
+			boolean foundWinningMove = false;
+			boolean foundDrawMove = false;
+
+			for (final Node child : node.children) {
+				if (child.solved) {
+					if (child.solvedValue == -1.0f) {
+						foundWinningMove = true;
+						break;
+					}
+
+					if (child.solvedValue == 0.0f) {
+						foundDrawMove = true;
+					}
+				} else {
+					allChildrenSolved = false;
+				}
+			}
+
+			if (foundWinningMove) {
+				node.solved = true;
+				node.solvedValue = 1.0f;
+			} else if (allChildrenSolved) {
+				node.solved = true;
+				node.solvedValue = foundDrawMove? 0.0f : -1.0f;
+			}
+		}
+	}
+
 	private long randomSetBit(long value) {
 		if (0L == value) {
 			return 0;
 		}

 		final int bitCount = Long.bitCount(value);
-		final int randomBitCount = random.nextInt(bitCount);
+		final int randomBitCount = random.get().nextInt(bitCount);

 		for (int i = 0; i < randomBitCount; i++) {
 			value &= value - 1;
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI4.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI4.java
@@ -0,0 +1,359 @@
+package org.toop.game.players.ai;
+
+import org.toop.framework.gameFramework.model.game.TurnBasedGame;
+import org.toop.framework.gameFramework.model.player.AbstractAI;
+
+import java.util.ArrayList;
+import java.util.List;
+import java.util.Random;
+import java.util.concurrent.Callable;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.Future;
+
+public class MCTSAI4<T extends TurnBasedGame<T>> extends AbstractAI<T> {
+	private static class Node {
+		public TurnBasedGame<?> state;
+
+		public long move;
+		public long unexpandedMoves;
+
+		public Node parent;
+
+		public Node[] children;
+		public int expanded;
+
+		public float value;
+		public int visits;
+
+		public boolean solved;
+		public float solvedValue;
+
+		public Node(TurnBasedGame<?> state, Node parent, long move) {
+			final long legalMoves = state.getLegalMoves();
+
+			this.state = state;
+
+			this.move = move;
+			this.unexpandedMoves = legalMoves;
+
+			this.parent = parent;
+
+			this.children = new Node[Long.bitCount(legalMoves)];
+			this.expanded = 0;
+
+			this.value = 0.0f;
+			this.visits = 0;
+
+			this.solved = false;
+			this.solvedValue = 0.0f;
+		}
+
+		public Node(TurnBasedGame<?> state) {
+			this(state, null, 0L);
+		}
+
+		public boolean isFullyExpanded() {
+			return expanded == children.length;
+		}
+
+		public float calculateUCT(int parentVisits) {
+			if (visits == 0) {
+				return Float.POSITIVE_INFINITY;
+			}
+
+			final float exploitation = value / visits;
+			final float exploration = 1.41f * (float)(Math.sqrt(Math.log(parentVisits) / visits));
+
+			return exploitation + exploration;
+		}
+
+		public Node bestUCTChild() {
+			Node highestUCTChild = null;
+			float highestUCT = Float.NEGATIVE_INFINITY;
+
+			for (int i = 0; i < expanded; i++) {
+				final float childUCT = children[i].calculateUCT(visits);
+
+				if (childUCT > highestUCT) {
+					highestUCTChild = children[i];
+					highestUCT = childUCT;
+				}
+			}
+
+			return highestUCTChild;
+		}
+	}
+
+	private static final ThreadLocal<Random> random = ThreadLocal.withInitial(Random::new);
+
+	private final int milliseconds;
+	private final int threads;
+
+	private final Node[] threadRoots;
+
+	public MCTSAI4(int milliseconds, int threads) {
+		this.milliseconds = milliseconds;
+		this.threads = threads;
+
+		this.threadRoots = new Node[threads];
+	}
+
+	public MCTSAI4(MCTSAI4<T> other) {
+		this.milliseconds = other.milliseconds;
+		this.threads = other.threads;
+
+		this.threadRoots = other.threadRoots;
+	}
+
+	@Override
+	public MCTSAI4<T> deepCopy() {
+		return new MCTSAI4<>(this);
+	}
+
+	@Override
+	public long getMove(T game) { // runs one independent search per thread and returns the move with the most summed visits
+		for (int i = 0; i < threads; i++) {
+			threadRoots[i] = findOrResetRoot(threadRoots[i], game); // keep the previous tree while its board still matches
+		}
+
+		final ExecutorService pool = Executors.newFixedThreadPool(threads);
+		final long endTime = System.nanoTime() + milliseconds * 1_000_000L; // shared deadline in nanoseconds
+
+		final List<Callable<Node>> tasks = new ArrayList<>();
+
+		for (int i = 0; i < threads; i++) {
+			final int threadIndex = i;
+
+			tasks.add(() -> {
+				final Node localRoot = threadRoots[threadIndex]; // each task only touches its own tree
+
+				while (System.nanoTime() < endTime) {
+					Node leaf = selection(localRoot);
+					leaf = expansion(leaf);
+					final float value = simulation(leaf);
+					backPropagation(leaf, value);
+				}
+
+				return localRoot;
+			});
+		}
+
+		try {
+			final List<Future<Node>> results = pool.invokeAll(tasks); // blocks until every task has finished
+
+			final Node root = new Node(game.deepCopy()); // scratch root that only accumulates visit counts
+
+			for (int i = 0; i < root.children.length; i++) {
+				expansion(root);
+			}
+
+			for (final Future<Node> result : results) {
+				final Node localRoot = result.get();
+
+				for (int c = 0; c < localRoot.expanded; c++) { // slots past 'expanded' are still null and must be skipped
+					final Node localChild = localRoot.children[c];
+
+					for (int i = 0; i < root.children.length; i++) {
+						if (localChild.move == root.children[i].move) {
+							root.children[i].visits += localChild.visits;
+							root.visits += localChild.visits;
+							break;
+						}
+					}
+				}
+			}
+
+			final long move = mostVisitedChild(root).move; // throws on a root without children; handled by the catch below
+
+			for (int i = 0; i < threads; i++) {
+				threadRoots[i] = findChildByMove(threadRoots[i], move); // advance each tree; null makes the next call rebuild it
+			}
+
+			return move;
+		} catch (Exception _) { // best effort; NOTE(review): this also swallows InterruptedException without re-interrupting
+			return randomSetBit(game.getLegalMoves()); // random legal move, or 0 when there are none
+		} finally {
+			pool.shutdown(); // always release the worker threads, including when invokeAll is interrupted
+		}
+	}
+
+	private Node mostVisitedChild(Node root) {
+		Node mostVisitedChild = null;
+		int mostVisited = -1;
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].visits > mostVisited) {
+				mostVisitedChild = root.children[i];
+				mostVisited = root.children[i].visits;
+			}
+		}
+
+		return mostVisitedChild;
+	}
+
+	private Node findOrResetRoot(Node root, T game) {
+		if (root == null) {
+			return new Node(game.deepCopy());
+		}
+
+		if (areStatesEqual(root.state.getBoard(), game.getBoard())) {
+			return root;
+		}
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (areStatesEqual(root.children[i].state.getBoard(), game.getBoard())) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return new Node(game.deepCopy());
+	}
+
+	private Node findChildByMove(Node root, long move) {
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].move == move) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return null;
+	}
+
+	private boolean areStatesEqual(long[] state1, long[] state2) {
+		if (state1.length != state2.length) {
+			return false;
+		}
+
+		for (int i = 0; i < state1.length; i++) {
+			if (state1[i] != state2[i]) {
+				return false;
+			}
+		}
+
+		return true;
+	}
+
+	private Node selection(Node root) {
+		while (!root.solved && root.isFullyExpanded() && !root.state.isTerminal()) {
+			root = root.bestUCTChild();
+		}
+
+		return root;
+	}
+
+	private Node expansion(Node leaf) {
+		if (leaf.unexpandedMoves == 0L) {
+			return leaf;
+		}
+
+		final long unexpandedMove = leaf.unexpandedMoves & -leaf.unexpandedMoves;
+
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		copiedState.play(unexpandedMove);
+
+		final Node expandedChild = new Node(copiedState, leaf, unexpandedMove);
+
+		leaf.children[leaf.expanded] = expandedChild;
+		leaf.expanded++;
+
+		leaf.unexpandedMoves &= ~unexpandedMove;
+
+		return expandedChild;
+	}
+
+	private float simulation(Node leaf) {
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		final int playerIndex = 1 - copiedState.getCurrentTurn();
+
+		while (!copiedState.isTerminal()) {
+			final long legalMoves = copiedState.getLegalMoves();
+			final long randomMove = randomSetBit(legalMoves);
+
+			copiedState.play(randomMove);
+		}
+
+		if (copiedState.getWinner() == playerIndex) {
+			return 1.0f;
+		}
+
+		if (copiedState.getWinner() >= 0) {
+			return -1.0f;
+		}
+
+		return 0.0f;
+	}
+
+	private void backPropagation(Node leaf, float value) {
+		while (leaf != null) {
+			leaf.value += value;
+			leaf.visits++;
+
+			if (!leaf.solved) {
+				updateSolvedStatus(leaf);
+			}
+
+			value = -value;
+			leaf = leaf.parent;
+		}
+	}
+
+	private void updateSolvedStatus(Node node) { // flags 'node' as solved once its outcome is decided; invoked during backPropagation
+		if (node.state.isTerminal()) { // a finished game is solved immediately
+			node.solved = true;
+
+			final int winner = node.state.getWinner(); // -1 is handled as "no winner" below
+			final int mover = 1 - node.state.getCurrentTurn(); // assumes exactly two players indexed 0 and 1
+
+			node.solvedValue = winner == mover? 1.0f : winner == -1? 0.0f : -1.0f; // +1 mover won, 0 no winner, -1 other player won
+
+			return;
+		}
+
+		if (node.isFullyExpanded()) { // all child slots are filled, so the loop below never sees null
+			boolean allChildrenSolved = true;
+			boolean foundWinningMove = false;
+			boolean foundDrawMove = false;
+
+			for (final Node child : node.children) { // NOTE(review): child.solvedValue is relative to the child's mover — confirm the sign:
+				if (child.solved) { // if the turn advances on every play, that mover is the player choosing at this node,
+					if (child.solvedValue == -1.0f) { // so a -1 child would be a losing option for them, not a proof for this node
+						foundWinningMove = true;
+						break; // one such child is enough to decide the node as written
+					}
+
+					if (child.solvedValue == 0.0f) {
+						foundDrawMove = true;
+					}
+				} else {
+					allChildrenSolved = false; // an unsolved child blocks the "all solved" conclusion
+				}
+			}
+
+			if (foundWinningMove) {
+				node.solved = true;
+				node.solvedValue = 1.0f;
+			} else if (allChildrenSolved) { // every child solved and none at -1
+				node.solved = true;
+				node.solvedValue = foundDrawMove? 0.0f : -1.0f; // 0 if any child is 0, otherwise -1
+			}
+		}
+	}
+
+	private long randomSetBit(long value) {
+		if (0L == value) {
+			return 0;
+		}
+
+		final int bitCount = Long.bitCount(value);
+		final int randomBitCount = random.get().nextInt(bitCount);
+
+		for (int i = 0; i < randomBitCount; i++) {
+			value &= value - 1;
+		}
+
+		return value & -value;
+	}
+}
--- a/game/src/main/java/org/toop/game/players/ai/MCTSAI5.java
+++ b/game/src/main/java/org/toop/game/players/ai/MCTSAI5.java
@@ -0,0 +1,371 @@
+package org.toop.game.players.ai;
+
+import org.toop.framework.gameFramework.model.game.TurnBasedGame;
+import org.toop.framework.gameFramework.model.player.AbstractAI;
+
+import java.util.ArrayList;
+import java.util.List;
+import java.util.Random;
+import java.util.concurrent.Callable;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.Future;
+
+/**
+ * Monte Carlo Tree Search player that grows one independent search tree per
+ * worker thread and plays the move whose root children collected the most
+ * visits summed over all trees.
+ *
+ * <p>After a move is chosen every tree is re-rooted at the matching child, so
+ * the statistics gathered so far are reused on the next call when the position
+ * can be found again.
+ *
+ * @param <T> concrete game type this AI plays
+ */
+public class MCTSAI5<T extends TurnBasedGame<T>> extends AbstractAI<T> {
+	/** Weight of the exploration term in {@code Node.calculateUCT}. */
+	private static final float EXPLORATION_WEIGHT = 1.41f;
+
+	/** A playout step asks the game for its heuristic move when a uniform draw exceeds this. */
+	private static final float HEURISTIC_PLAYOUT_THRESHOLD = 0.9f;
+
+	/** One node of a search tree: a game state plus the statistics gathered for it. */
+	private static class Node {
+		/** Game state this node stands for. */
+		public TurnBasedGame<?> state;
+
+		/** Move that produced this node from its parent; 0 for a root. */
+		public long move;
+		/** Bitmask of legal moves that have no child node yet. */
+		public long unexpandedMoves;
+
+		/** Parent node, or {@code null} for a root. */
+		public Node parent;
+
+		/** One slot per legal move; only the first {@link #expanded} slots are filled. */
+		public Node[] children;
+		/** Number of filled slots in {@link #children}. */
+		public int expanded;
+
+		/** Sum of the playout results back-propagated through this node. */
+		public float value;
+		/** Number of back-propagations that passed through this node. */
+		public int visits;
+
+		/** Whether the result of this node has been proven. */
+		public boolean solved;
+		/** Proven result (1, 0 or -1); only meaningful while {@link #solved} is set. */
+		public float solvedValue;
+
+		/** Result of {@code state.rateMove(move)}, used as a selection bias. */
+		public float heuristic;
+
+		/**
+		 * Creates a node with empty statistics.
+		 *
+		 * @param state  game state after {@code move} was played; stored as-is, not copied
+		 * @param parent parent node, or {@code null} for a root
+		 * @param move   move that led to {@code state}
+		 */
+		public Node(TurnBasedGame<?> state, Node parent, long move) {
+			final long legalMoves = state.getLegalMoves();
+
+			this.state = state;
+
+			this.move = move;
+			this.unexpandedMoves = legalMoves;
+
+			this.parent = parent;
+
+			this.children = new Node[Long.bitCount(legalMoves)];
+			this.expanded = 0;
+
+			this.value = 0.0f;
+			this.visits = 0;
+
+			this.solved = false;
+			this.solvedValue = 0.0f;
+
+			this.heuristic = state.rateMove(move);
+		}
+
+		/**
+		 * Creates a root node (no parent, move 0).
+		 *
+		 * @param state game state of the root; stored as-is, not copied
+		 */
+		public Node(TurnBasedGame<?> state) {
+			this(state, null, 0L);
+		}
+
+		/** @return {@code true} when every legal move has a child node */
+		public boolean isFullyExpanded() {
+			return expanded == children.length;
+		}
+
+		/**
+		 * Selection score of this node: average value, plus an exploration term
+		 * that shrinks with the visit count, plus the heuristic divided by the
+		 * visit count.
+		 *
+		 * @param parentVisits visit count of the parent node
+		 * @return the score, or positive infinity for a node without visits
+		 */
+		public float calculateUCT(int parentVisits) {
+			if (visits == 0) {
+				return Float.POSITIVE_INFINITY;
+			}
+
+			final float exploitation = value / visits;
+			final float exploration = EXPLORATION_WEIGHT * (float) Math.sqrt(Math.log(parentVisits) / visits);
+			final float bias = heuristic / visits;
+
+			return exploitation + exploration + bias;
+		}
+
+		/**
+		 * @return the expanded child with the highest {@link #calculateUCT(int)}
+		 *         score (first one on ties), or {@code null} when no child has
+		 *         been expanded
+		 */
+		public Node bestUCTChild() {
+			Node highestUCTChild = null;
+			float highestUCT = Float.NEGATIVE_INFINITY;
+
+			for (int i = 0; i < expanded; i++) {
+				final float childUCT = children[i].calculateUCT(visits);
+
+				if (childUCT > highestUCT) {
+					highestUCTChild = children[i];
+					highestUCT = childUCT;
+				}
+			}
+
+			return highestUCTChild;
+		}
+	}
+
+	/** Per-thread random generator, so worker threads never share a {@link Random}. */
+	private static final ThreadLocal<Random> random = ThreadLocal.withInitial(Random::new);
+
+	/** Search time per call of {@link #getMove}, in milliseconds. */
+	private final int milliseconds;
+	/** Number of worker threads, and therefore of independent search trees. */
+	private final int threads;
+
+	/** Current root of each worker's tree; {@code null} until a tree exists for that slot. */
+	private final Node[] threadRoots;
+
+	/**
+	 * @param milliseconds search time per move, in milliseconds
+	 * @param threads      number of worker threads / independent search trees
+	 */
+	public MCTSAI5(int milliseconds, int threads) {
+		this.milliseconds = milliseconds;
+		this.threads = threads;
+
+		this.threadRoots = new Node[threads];
+	}
+
+	/**
+	 * Copy constructor: copies the configuration of {@code other}.
+	 *
+	 * <p>The copy starts with its own empty set of search trees. Sharing the
+	 * root array (and with it the mutable nodes) would let two instances
+	 * re-root and update each other's trees.
+	 *
+	 * @param other instance to copy the settings from
+	 */
+	public MCTSAI5(MCTSAI5<T> other) {
+		this.milliseconds = other.milliseconds;
+		this.threads = other.threads;
+
+		this.threadRoots = new Node[other.threads];
+	}
+
+	@Override
+	public MCTSAI5<T> deepCopy() {
+		return new MCTSAI5<>(this);
+	}
+
+	/**
+	 * Searches for the configured time on all worker threads and returns the
+	 * move with the most visits summed over the workers' trees.
+	 *
+	 * <p>If the search fails or the calling thread is interrupted, a random
+	 * legal move is returned instead (0 when there is none). An interrupt is
+	 * restored on the calling thread.
+	 *
+	 * @param game current game; it is only read and copied, never played on
+	 * @return the chosen move
+	 */
+	@Override
+	public long getMove(T game) {
+		for (int i = 0; i < threads; i++) {
+			threadRoots[i] = findOrResetRoot(threadRoots[i], game);
+		}
+
+		final ExecutorService pool = Executors.newFixedThreadPool(threads);
+
+		try {
+			final long endTime = System.nanoTime() + milliseconds * 1_000_000L;
+
+			final List<Callable<Node>> tasks = new ArrayList<>();
+
+			for (int i = 0; i < threads; i++) {
+				final int threadIndex = i;
+
+				tasks.add(() -> searchUntil(threadRoots[threadIndex], endTime));
+			}
+
+			final List<Future<Node>> results = pool.invokeAll(tasks);
+
+			// Scratch root that only collects the summed visit counts per move.
+			final Node root = new Node(game.deepCopy());
+
+			for (int i = 0; i < root.children.length; i++) {
+				expansion(root);
+			}
+
+			for (final Future<Node> result : results) {
+				mergeRootVisits(root, result.get());
+			}
+
+			final Node mostVisitedChild = mostVisitedChild(root);
+
+			if (mostVisitedChild == null) {
+				// No child at all: nothing to choose from.
+				return randomSetBit(game.getLegalMoves());
+			}
+
+			final long move = mostVisitedChild.move;
+
+			// Keep the subtree below the chosen move for the next call.
+			for (int i = 0; i < threads; i++) {
+				threadRoots[i] = findChildByMove(threadRoots[i], move);
+			}
+
+			return move;
+		} catch (InterruptedException _) {
+			// Keep the interrupt visible to the caller, then fall back.
+			Thread.currentThread().interrupt();
+			return randomSetBit(game.getLegalMoves());
+		} catch (Exception _) {
+			// Best effort: a failed search still has to produce a move.
+			return randomSetBit(game.getLegalMoves());
+		} finally {
+			// Always release the worker threads, also when the search failed.
+			pool.shutdown();
+		}
+	}
+
+	/**
+	 * Runs select / expand / simulate / back-propagate iterations on one tree
+	 * until the deadline has passed.
+	 *
+	 * @param localRoot root of the tree to grow
+	 * @param endTime   deadline as a {@link System#nanoTime()} value
+	 * @return {@code localRoot}
+	 */
+	private Node searchUntil(Node localRoot, long endTime) {
+		// Compare by difference: nanoTime values may wrap around.
+		while (System.nanoTime() - endTime < 0L) {
+			final Node selected = selection(localRoot);
+			final Node leaf = expansion(selected);
+
+			backPropagation(leaf, simulation(leaf));
+		}
+
+		return localRoot;
+	}
+
+	/**
+	 * Adds the visit counts of the expanded children of {@code localRoot} to
+	 * the children of {@code root} that carry the same move.
+	 *
+	 * @param root      node receiving the summed visit counts
+	 * @param localRoot root of one worker's tree
+	 */
+	private void mergeRootVisits(Node root, Node localRoot) {
+		// Only the first 'expanded' slots are filled; the rest are still null.
+		for (int c = 0; c < localRoot.expanded; c++) {
+			final Node localChild = localRoot.children[c];
+
+			for (int i = 0; i < root.expanded; i++) {
+				if (localChild.move == root.children[i].move) {
+					root.children[i].visits += localChild.visits;
+					root.visits += localChild.visits;
+					break;
+				}
+			}
+		}
+	}
+
+	/**
+	 * @param root node whose expanded children are compared
+	 * @return the expanded child with the most visits (first one on ties), or
+	 *         {@code null} when {@code root} has no expanded child
+	 */
+	private Node mostVisitedChild(Node root) {
+		Node mostVisitedChild = null;
+		int mostVisited = -1;
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].visits > mostVisited) {
+				mostVisitedChild = root.children[i];
+				mostVisited = root.children[i].visits;
+			}
+		}
+
+		return mostVisitedChild;
+	}
+
+	/**
+	 * Finds the node matching the board of {@code game}: {@code root} itself or
+	 * one of its expanded children (which is then detached from its parent).
+	 * When neither matches, or {@code root} is {@code null}, a fresh root is
+	 * built from a copy of {@code game}.
+	 *
+	 * @param root previous root of a tree, may be {@code null}
+	 * @param game current game
+	 * @return the root to search from
+	 */
+	private Node findOrResetRoot(Node root, T game) {
+		if (root == null) {
+			return new Node(game.deepCopy());
+		}
+
+		if (areStatesEqual(root.state.getBoard(), game.getBoard())) {
+			return root;
+		}
+
+		for (int i = 0; i < root.expanded; i++) {
+			if (areStatesEqual(root.children[i].state.getBoard(), game.getBoard())) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return new Node(game.deepCopy());
+	}
+
+	/**
+	 * Returns the expanded child of {@code root} reached by {@code move} and
+	 * detaches it from {@code root}.
+	 *
+	 * @param root node whose children are searched
+	 * @param move move to look for
+	 * @return the matching child, or {@code null} when no expanded child has that move
+	 */
+	private Node findChildByMove(Node root, long move) {
+		for (int i = 0; i < root.expanded; i++) {
+			if (root.children[i].move == move) {
+				root.children[i].parent = null;
+				return root.children[i];
+			}
+		}
+
+		return null;
+	}
+
+	/**
+	 * @param state1 first board
+	 * @param state2 second board
+	 * @return {@code true} when both arrays have the same length and equal elements
+	 */
+	private boolean areStatesEqual(long[] state1, long[] state2) {
+		if (state1.length != state2.length) {
+			return false;
+		}
+
+		for (int i = 0; i < state1.length; i++) {
+			if (state1[i] != state2[i]) {
+				return false;
+			}
+		}
+
+		return true;
+	}
+
+	/**
+	 * Descends from {@code root} by best selection score until reaching a node
+	 * that is solved, terminal, or still has moves without a child.
+	 *
+	 * @param root node to start from
+	 * @return the node at which the descent stopped
+	 */
+	private Node selection(Node root) {
+		while (!root.solved && root.isFullyExpanded() && !root.state.isTerminal()) {
+			root = root.bestUCTChild();
+		}
+
+		return root;
+	}
+
+	/**
+	 * Adds one child to {@code leaf} for its lowest unexpanded move.
+	 *
+	 * @param leaf node to expand
+	 * @return the new child, or {@code leaf} itself when it has no unexpanded move
+	 */
+	private Node expansion(Node leaf) {
+		if (leaf.unexpandedMoves == 0L) {
+			return leaf;
+		}
+
+		// Lowest set bit of the mask.
+		final long unexpandedMove = leaf.unexpandedMoves & -leaf.unexpandedMoves;
+
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		copiedState.play(unexpandedMove);
+
+		final Node expandedChild = new Node(copiedState, leaf, unexpandedMove);
+
+		leaf.children[leaf.expanded] = expandedChild;
+		leaf.expanded++;
+
+		leaf.unexpandedMoves &= ~unexpandedMove;
+
+		return expandedChild;
+	}
+
+	/**
+	 * Plays a copy of the state of {@code leaf} to the end. Each step uses the
+	 * game's heuristic move when a uniform draw exceeds
+	 * {@link #HEURISTIC_PLAYOUT_THRESHOLD} and a random legal move otherwise.
+	 *
+	 * @param leaf node to start the playout from; its state is not modified
+	 * @return 1 when the winner is player index {@code 1 - getCurrentTurn()} of
+	 *         the leaf state, -1 when another player won, 0 when there is no winner
+	 */
+	private float simulation(Node leaf) {
+		final TurnBasedGame<?> copiedState = leaf.state.deepCopy();
+		final int playerIndex = 1 - copiedState.getCurrentTurn();
+
+		while (!copiedState.isTerminal()) {
+			final long legalMoves = copiedState.getLegalMoves();
+
+			final long move = random.get().nextFloat() > HEURISTIC_PLAYOUT_THRESHOLD
+					? copiedState.heuristicMove(legalMoves)
+					: randomSetBit(legalMoves);
+
+			copiedState.play(move);
+		}
+
+		final int winner = copiedState.getWinner();
+
+		if (winner == playerIndex) {
+			return 1.0f;
+		}
+
+		if (winner >= 0) {
+			return -1.0f;
+		}
+
+		return 0.0f;
+	}
+
+	/**
+	 * Walks from {@code leaf} up to the root, adding the playout result to each
+	 * node and counting the visit. The sign of the result flips at every level.
+	 *
+	 * @param leaf  node the playout started from; {@code null} makes this a no-op
+	 * @param value playout result credited to {@code leaf}
+	 */
+	private void backPropagation(Node leaf, float value) {
+		while (leaf != null) {
+			leaf.value += value;
+			leaf.visits++;
+
+			// Once a node is solved it is never re-evaluated.
+			if (!leaf.solved) {
+				updateSolvedStatus(leaf);
+			}
+
+			value = -value;
+			leaf = leaf.parent;
+		}
+	}
+
+	/**
+	 * Marks {@code node} as solved when its result can already be proven.
+	 *
+	 * <p>A terminal node is scored for player index {@code 1 - getCurrentTurn()}:
+	 * 1 for a win, 0 when the winner is -1, otherwise -1. A fully expanded inner
+	 * node is a win (1) as soon as one child is solved with -1; when all children
+	 * are solved without such a child it is a draw (0) if any child is solved
+	 * with 0 and a loss (-1) otherwise.
+	 *
+	 * @param node node whose {@code solved} / {@code solvedValue} may be set
+	 */
+	private void updateSolvedStatus(Node node) {
+		if (node.state.isTerminal()) {
+			node.solved = true;
+
+			final int winner = node.state.getWinner();
+			final int mover = 1 - node.state.getCurrentTurn();
+
+			node.solvedValue = winner == mover? 1.0f : winner == -1? 0.0f : -1.0f;
+
+			return;
+		}
+
+		if (node.isFullyExpanded()) {
+			boolean allChildrenSolved = true;
+			boolean foundWinningMove = false;
+			boolean foundDrawMove = false;
+
+			for (final Node child : node.children) {
+				if (child.solved) {
+					// A child solved with -1 is enough to solve this node with 1.
+					if (child.solvedValue == -1.0f) {
+						foundWinningMove = true;
+						break;
+					}
+
+					if (child.solvedValue == 0.0f) {
+						foundDrawMove = true;
+					}
+				} else {
+					allChildrenSolved = false;
+				}
+			}
+
+			if (foundWinningMove) {
+				node.solved = true;
+				node.solvedValue = 1.0f;
+			} else if (allChildrenSolved) {
+				node.solved = true;
+				node.solvedValue = foundDrawMove? 0.0f : -1.0f;
+			}
+		}
+	}
+
+	/**
+	 * Picks one of the set bits of {@code value} with the calling thread's
+	 * random generator and returns it as a single-bit mask.
+	 *
+	 * @param value bitmask to choose from
+	 * @return a mask with exactly one bit of {@code value} set, or 0 when
+	 *         {@code value} has no set bits
+	 */
+	private long randomSetBit(long value) {
+		if (0L == value) {
+			return 0L;
+		}
+
+		final int bitCount = Long.bitCount(value);
+		final int randomBitCount = random.get().nextInt(bitCount);
+
+		// Clear the lowest set bit once for every bit that has to be skipped.
+		for (int i = 0; i < randomBitCount; i++) {
+			value &= value - 1;
+		}
+
+		return value & -value;
+	}
+}