changed reward to be in the range [0,1]

2011-06-29 09:39:14 +08:00 · 2011-06-29 09:39:14 +08:00 · 9c9bf47abe
parent df6a3c546a
commit 9c9bf47abe
1 changed files with 8 additions and 3 deletions
--- a/src/magic/ai/MCTSAI.java
+++ b/src/magic/ai/MCTSAI.java
@ -101,6 +101,10 @@ public class MCTSAI implements MagicAI {
               C * Math.sqrt(Math.log(parent.getNumSim()) / child.getNumSim());
    }
    private double selectMOSS(final MCTSGameTree parent, final MCTSGameTree child) {
        return 0.0;
    }
    private double selectRatio(final MCTSGameTree parent, final MCTSGameTree child) {
        return (parent.sign() * child.getScore() + 10)/(child.getNumSim() + 10);
    }
@ -362,6 +366,7 @@ public class MCTSAI implements MagicAI {
        return path;
    }
    //returns a reward in the range [0, 1]
    private double randomPlay(final MCTSGameTree node, final MagicGame game) {
        //terminal node, no need for random play
        if (game.isFinished()) {
@ -369,7 +374,7 @@ public class MCTSAI implements MagicAI {
            if (game.getLosingPlayer() == game.getScorePlayer()) {
                node.setAILose(0);
-                return -1.0;
+                return 0.0;
            } else {
                node.setAIWin(0);
                return 1.0;
@ -387,9 +392,9 @@ public class MCTSAI implements MagicAI {
        if (game.getLosingPlayer() == null) {
            return 0;
        } else if (game.getLosingPlayer() == game.getScorePlayer()) {
-            return  -(1.0 - actions/((double)MAX_ACTIONS));
+            return  actions/(2.0 * MAX_ACTIONS);
        } else {
-            return  1.0 - actions/((double)MAX_ACTIONS);
+            return  1.0 - actions/(2.0 * MAX_ACTIONS);
        }
    }