debug: we should estimate our own win rate (store the value target from the current player's perspective, i.e. data.winner * color)
This commit is contained in:
parent
8b7b4b6c6b
commit
32b7b33ed5
@@ -284,7 +284,7 @@ class ResNet(object):
|
|||||||
history.append(board)
|
history.append(board)
|
||||||
states.append(self._history2state(history, color))
|
states.append(self._history2state(history, color))
|
||||||
probs.append(np.array(prob).reshape(1, self.board_size ** 2 + 1))
|
probs.append(np.array(prob).reshape(1, self.board_size ** 2 + 1))
|
||||||
winner.append(np.array(data.winner).reshape(1, 1))
|
winner.append(np.array(data.winner * color).reshape(1, 1))
|
||||||
color *= -1
|
color *= -1
|
||||||
states = np.concatenate(states, axis=0)
|
states = np.concatenate(states, axis=0)
|
||||||
probs = np.concatenate(probs, axis=0)
|
probs = np.concatenate(probs, axis=0)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user