debug for reversi
This commit is contained in:
parent
08b6649fea
commit
b699258e76
@ -123,7 +123,7 @@ class Game:
|
|||||||
sys.stdout.flush()
|
sys.stdout.flush()
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
game = Game(name="go", checkpoint_path="./checkpoint")
|
game = Game(name="reversi", checkpoint_path=None)
|
||||||
game.debug = True
|
game.debug = True
|
||||||
game.think_play_move(utils.BLACK)
|
game.think_play_move(utils.BLACK)
|
||||||
|
|
||||||
|
@ -18,12 +18,11 @@ class Player(object):
|
|||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
parser = argparse.ArgumentParser()
|
parser = argparse.ArgumentParser()
|
||||||
parser.add_argument("--checkpoint_path", type=str, default=None)
|
parser.add_argument("--checkpoint_path", type=str, default="None")
|
||||||
parser.add_argument("--role", type=str, default="unknown")
|
parser.add_argument("--role", type=str, default="unknown")
|
||||||
parser.add_argument("--debug", type=str, default=False)
|
parser.add_argument("--debug", type=str, default="False")
|
||||||
parser.add_argument("--game", type=str, default=False)
|
parser.add_argument("--game", type=str, default="go")
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
|
||||||
if args.checkpoint_path == 'None':
|
if args.checkpoint_path == 'None':
|
||||||
args.checkpoint_path = None
|
args.checkpoint_path = None
|
||||||
game = Game(name=args.game, role=args.role,
|
game = Game(name=args.game, role=args.role,
|
||||||
|
@ -99,7 +99,7 @@ class Reversi:
|
|||||||
|
|
||||||
def simulate_hashable_conversion(self, state):
|
def simulate_hashable_conversion(self, state):
|
||||||
# since go is MDP, we only need the last board for hashing
|
# since go is MDP, we only need the last board for hashing
|
||||||
return tuple(state[0][-1])
|
return tuple(state[0][-1].flatten().tolist())
|
||||||
|
|
||||||
def _get_winner(self, board):
|
def _get_winner(self, board):
|
||||||
black_num, white_num = self._number_of_black_and_white(board)
|
black_num, white_num = self._number_of_black_and_white(board)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user