debug: we should estimate the win rate from the current player's perspective (winner * color)

2018-01-08 16:19:59 +08:00 · 2018-01-08 16:19:59 +08:00 · 32b7b33ed5
commit 32b7b33ed5
parent 8b7b4b6c6b
1 changed file with 1 addition and 1 deletion
--- a/AlphaGo/model.py
+++ b/AlphaGo/model.py
@@ -284,7 +284,7 @@ class ResNet(object):
            history.append(board)
            states.append(self._history2state(history, color))
            probs.append(np.array(prob).reshape(1, self.board_size ** 2 + 1))
-            winner.append(np.array(data.winner).reshape(1, 1))
+            winner.append(np.array(data.winner * color).reshape(1, 1))
            color *= -1
        states = np.concatenate(states, axis=0)
        probs = np.concatenate(probs, axis=0)