From 0ab38743aa054083410ca8e6d6f80f9018a8f1d4 Mon Sep 17 00:00:00 2001 From: Wenbo Hu Date: Wed, 20 Dec 2017 21:52:30 +0800 Subject: [PATCH] minor revision. --- AlphaGo/go.py | 3 +-- tianshou/core/mcts/mcts.py | 1 + 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/AlphaGo/go.py b/AlphaGo/go.py index 009d369..cbbe07c 100644 --- a/AlphaGo/go.py +++ b/AlphaGo/go.py @@ -180,7 +180,6 @@ class Go: if not self._knowledge_prunning(current_board, color, vertex): return False - return True def simulate_is_valid_list(self, state, action_set): @@ -188,7 +187,7 @@ class Go: ## if no action is valid, then pass valid_action_list = [] for action_candidate in action_set: - if self.simulate_is_valid(state, action_candidate): + if not self.simulate_is_valid(state, action_candidate): valid_action_list.append(action_candidate) if not valid_action_list: valid_action_list.append(utils.PASS) diff --git a/tianshou/core/mcts/mcts.py b/tianshou/core/mcts/mcts.py index c14496d..5aca06a 100644 --- a/tianshou/core/mcts/mcts.py +++ b/tianshou/core/mcts/mcts.py @@ -71,6 +71,7 @@ class UCTNode(MCTSNode): self.parent.backpropagation(self.children[action].reward) def valid_mask(self, simulator): + # make all invalid actions illegal in mcts if self.mask is None: self.mask = simulator.simulate_is_valid_list(self.state, range(self.action_num - 1)) self.ucb[self.mask] = -float("Inf")