merge

2017-12-22 17:17:50 +08:00 · 2017-12-22 17:17:50 +08:00 · 5b044c9a0c
commit 5b044c9a0c
parent d8c0eae6a3 51b8e7fc18
3 changed files with 61 additions and 276 deletions
--- a/AlphaGo/go.py
+++ b/AlphaGo/go.py
@ -308,3 +308,42 @@ class Go:

        return score

+if __name__ == "__main__":
+    ### do unit test for Go class
+    pure_test = [
+        0, 1, 0, 1, 0, 1, 0, 0, 0,
+        1, 0, 1, 0, 1, 0, 0, 0, 0,
+        0, 1, 0, 1, 0, 0, 1, 0, 0,
+        0, 0, 1, 0, 0, 1, 0, 1, 0,
+        0, 0, 0, 0, 0, 1, 1, 1, 0,
+        1, 1, 1, 0, 0, 0, 0, 0, 0,
+        1, 0, 1, 0, 0, 1, 1, 0, 0,
+        1, 1, 1, 0, 1, 0, 1, 0, 0,
+        0, 0, 0, 0, 1, 1, 1, 0, 0
+    ]
+
+    pt_qry = [(1, 1), (1, 5), (3, 3), (4, 7), (7, 2), (8, 6)]
+    pt_ans = [True, True, True, True, True, True]
+
+    opponent_test = [
+        0, 1, 0, 1, 0, 1, 0,-1, 1,
+        1,-1, 0,-1, 1,-1, 0, 1, 0,
+        0, 0, 0, 0, 0, 0, 0, 0, 1,
+        1, 1,-1, 0, 1,-1, 1, 0, 0,
+        1, 0, 1, 0, 1, 0, 1, 0, 0,
+        -1,1, 1, 0, 1, 1, 1, 0, 0,
+        0, 1,-1, 0,-1,-1,-1, 0, 0,
+        1, 0, 1, 0,-1, 0,-1, 0, 0,
+        0, 1, 0, 0,-1,-1,-1, 0, 0
+    ]
+    ot_qry = [(1, 1), (1, 5), (2, 9), (5, 2), (5, 6), (8, 6), (8, 2)]
+    ot_ans = [False, False, False, False, False, False, True]
+
+    go = Go(size=9, komi=3.75)
+    for i in range(6):
+        print (go._is_eye(pure_test, utils.BLACK, pt_qry[i]))
+    print("Test of pure eye\n")
+
+    for i in range(7):
+        print (go._is_eye(opponent_test, utils.BLACK, ot_qry[i]))
+    print("Test of eye surrend by opponents\n")
--- a/AlphaGo/reversi.py
+++ b/AlphaGo/reversi.py
@ -34,7 +34,6 @@ def calc_flip(pos, own, enemy):
    :param enemy: bitboard
    :return: flip stones of enemy when I place stone at pos.
    """
-    assert 0 <= pos <= 63, f"pos={pos}"
    f1 = _calc_flip_half(pos, own, enemy)
    f2 = _calc_flip_half(63 - pos, rotate180(own), rotate180(enemy))
    return f1 | rotate180(f2)
@ -125,7 +124,14 @@ class Reversi:
        self.board = None  # 8 * 8 board with 1 for black, -1 for white and 0 for blank
        self.color = None  # 1 for black and -1 for white
        self.action = None   # number in 0~63
-        self.winner = None
+        # self.winner = None
+        self.black_win = None
+
+    def get_board(self, black=None, white=None):
+        self.black = black or (0b00001000 << 24 | 0b00010000 << 32)
+        self.white = white or (0b00010000 << 24 | 0b00001000 << 32)
+        self.board = self.bitboard2board() 	
+        return self.board

    def simulate_is_valid(self, board, color):
        self.board = board
@ -134,18 +140,19 @@ class Reversi:
        own, enemy = self.get_own_and_enemy()
        mobility = find_correct_moves(own, enemy)
        valid_moves = bit_to_array(mobility, 64)
+        valid_moves = np.argwhere(valid_moves)
        valid_moves = list(np.reshape(valid_moves, len(valid_moves)))
        return valid_moves

-    def simulate_step_forward(self, board, color, vertex):
-        self.board = board
-        self.color = color
+    def simulate_step_forward(self, state, vertex):
+        self.board = state[0]
+        self.color = state[1]
        self.board2bitboard()
        self.vertex2action(vertex)
        step_forward = self.step()
        if step_forward:
            new_board = self.bitboard2board()
-            return new_board
+            return [new_board, 0 - self.color], 0

    def executor_do_move(self, board, color, vertex):
        self.board = board
@ -155,13 +162,14 @@ class Reversi:
        step_forward = self.step()
        if step_forward:
            new_board = self.bitboard2board()
-            return new_board
+        for i in range(64):
+        	board[i] = new_board[i]

    def executor_get_score(self, board):
        self.board = board
        self._game_over()
-        if self.winner is not None:
-            return self.winner, 0 - self.winner
+        if self.black_win is not None:
+            return self.black_win
        else:
            ValueError("Game not finished!")

@ -219,6 +227,7 @@ class Reversi:

    def _game_over(self):
        # self.done = True
+        '''
        if self.winner is None:
            black_num, white_num = self.number_of_black_and_white
            if black_num > white_num:
@ -227,9 +236,12 @@ class Reversi:
                self.winner = -1
            else:
                self.winner = 0
+        '''
+        if self.black_win is None:
+        	black_num, white_num = self.number_of_black_and_white
+        	self.black_win = black_num - white_num

    def illegal_move_to_lose(self, action):
-        logger.warning(f"Illegal action={action}, No Flipped!")
        self._game_over()

    def get_own_and_enemy(self):
--- a/AlphaGo/unit_test.py
+++ b/AlphaGo/unit_test.py
@ -1,266 +0,0 @@
-import numpy as np
-import sys
-from game import Game
-from engine import GTPEngine
-import utils
-import time
-import copy
-import network_small
-import tensorflow as tf
-from collections import deque
-from tianshou.core.mcts.mcts import MCTS
-
-DELTA = [[1, 0], [-1, 0], [0, -1], [0, 1]]
-CORNER_OFFSET = [[-1, -1], [-1, 1], [1, 1], [1, -1]]
-
-class GoEnv:
-    def __init__(self, size=9, komi=6.5):
-        self.size = size
-        self.komi = komi
-        self.board = [utils.EMPTY] * (self.size * self.size)
-        self.history = deque(maxlen=8)
-
-    def _set_board(self, board):
-        self.board = board
-
-    def _flatten(self, vertex):
-        x, y = vertex
-        return (x - 1) * self.size + (y - 1)
-
-    def _bfs(self, vertex, color, block, status, alive_break):
-        block.append(vertex)
-        status[self._flatten(vertex)] = True
-        nei = self._neighbor(vertex)
-        for n in nei:
-            if not status[self._flatten(n)]:
-                if self.board[self._flatten(n)] == color:
-                    self._bfs(n, color, block, status, alive_break)
-
-    def _find_block(self, vertex, alive_break=False):
-        block = []
-        status = [False] * (self.size * self.size)
-        color = self.board[self._flatten(vertex)]
-        self._bfs(vertex, color, block, status, alive_break)
-
-        for b in block:
-            for n in self._neighbor(b):
-                if self.board[self._flatten(n)] == utils.EMPTY:
-                    return False, block
-        return True, block
-
-    def _is_qi(self, color, vertex):
-        nei = self._neighbor(vertex)
-        for n in nei:
-            if self.board[self._flatten(n)] == utils.EMPTY:
-                return True
-
-        self.board[self._flatten(vertex)] = color
-        for n in nei:
-            if self.board[self._flatten(n)] == utils.another_color(color):
-                can_kill, block = self._find_block(n)
-                if can_kill:
-                    self.board[self._flatten(vertex)] = utils.EMPTY
-                    return True
-
-        ### avoid suicide
-        can_kill, block = self._find_block(vertex)
-        if can_kill:
-            self.board[self._flatten(vertex)] = utils.EMPTY
-            return False
-
-        self.board[self._flatten(vertex)] = utils.EMPTY
-        return True
-
-    def _check_global_isomorphous(self, color, vertex):
-        ##backup
-        _board = copy.copy(self.board)
-        self.board[self._flatten(vertex)] = color
-        self._process_board(color, vertex)
-        if self.board in self.history:
-            res = True
-        else:
-            res = False
-
-        self.board = _board
-        return res
-
-    def _in_board(self, vertex):
-        x, y = vertex
-        if x < 1 or x > self.size: return False
-        if y < 1 or y > self.size: return False
-        return True
-
-    def _neighbor(self, vertex):
-        x, y = vertex
-        nei = []
-        for d in DELTA:
-            _x = x + d[0]
-            _y = y + d[1]
-            if self._in_board((_x, _y)):
-                nei.append((_x, _y))
-        return nei
-
-    def _corner(self, vertex):
-        x, y = vertex
-        corner = []
-        for d in CORNER_OFFSET:
-            _x = x + d[0]
-            _y = y + d[1]
-            if self._in_board((_x, _y)):
-                corner.append((_x, _y))
-        return corner
-
-    def _process_board(self, color, vertex):
-        nei = self._neighbor(vertex)
-        for n in nei:
-            if self.board[self._flatten(n)] == utils.another_color(color):
-                can_kill, block = self._find_block(n, alive_break=True)
-                if can_kill:
-                    for b in block:
-                        self.board[self._flatten(b)] = utils.EMPTY
-
-    def _find_group(self, start):
-        color = self.board[self._flatten(start)]
-        #print ("color : ", color)
-        chain = set()
-        frontier = [start]
-        while frontier:
-            current = frontier.pop()
-            #print ("current : ", current)
-            chain.add(current)
-            for n in self._neighbor(current):
-                #print n, self._flatten(n), self.board[self._flatten(n)],
-                if self.board[self._flatten(n)] == color and not n in chain:
-                    frontier.append(n)
-        return chain
-
-    def _is_eye(self, color, vertex):
-        nei = self._neighbor(vertex)
-        cor = self._corner(vertex)
-        ncolor = {color == self.board[self._flatten(n)] for n in nei}
-        if False in ncolor:
-            #print "not all neighbors are in same color with us"
-            return False
-        if set(nei) < self._find_group(nei[0]):
-            #print "all neighbors are in same group and same color with us"
-            return True
-        else:
-            opponent_number = [self.board[self._flatten(c)] for c in cor].count(-color)
-            opponent_propotion = float(opponent_number) / float(len(cor))
-            if opponent_propotion < 0.5:
-                #print "few opponents, real eye"
-                return True
-            else:
-                #print "many opponents, fake eye"
-                return False
-
-    # def is_valid(self, color, vertex):
-    def is_valid(self, state, action):
-        # state is the play board, the shape is [1, 9, 9, 17]
-        if action == self.size * self.size:
-            vertex = (0, 0)
-        else:
-            vertex = (action / self.size + 1, action % self.size + 1)
-        if state[0, 0, 0, -1] == utils.BLACK:
-            color = utils.BLACK
-        else:
-            color = utils.WHITE
-        self.history.clear()
-        for i in range(8):
-            self.history.append((state[:, :, :, i] - state[:, :, :, i + 8]).reshape(-1).tolist())
-        self.board = copy.copy(self.history[-1])
-        ### in board
-        if not self._in_board(vertex):
-            return False
-
-        ### already have stone
-        if not self.board[self._flatten(vertex)] == utils.EMPTY:
-            # print(np.array(self.board).reshape(9, 9))
-            # print(vertex)
-            return False
-
-        ### check if it is qi
-        if not self._is_qi(color, vertex):
-            return False
-
-        ### check if it is an eye of yourself
-        ### assumptions : notice that this judgement requires that the state is an endgame
-        #if self._is_eye(color, vertex):
-        #    return False
-
-        if self._check_global_isomorphous(color, vertex):
-            return False
-
-        return True
-
-    def do_move(self, color, vertex):
-        if vertex == utils.PASS:
-            return True
-
-        id_ = self._flatten(vertex)
-        if self.board[id_] == utils.EMPTY:
-            self.board[id_] = color
-            self.history.append(copy.copy(self.board))
-            return True
-        else:
-            return False
-
-    def step_forward(self, state, action):
-        if state[0, 0, 0, -1] == 1:
-            color = 1
-        else:
-            color = -1
-        if action == 81:
-            vertex = (0, 0)
-        else:
-            vertex = (action % 9 + 1, action / 9 + 1)
-        # print(vertex)
-        # print(self.board)
-        self.board = (state[:, :, :, 7] - state[:, :, :, 15]).reshape(-1).tolist()
-        self.do_move(color, vertex)
-        new_state = np.concatenate(
-            [state[:, :, :, 1:8], (np.array(self.board) == 1).reshape(1, 9, 9, 1),
-             state[:, :, :, 9:16], (np.array(self.board) == -1).reshape(1, 9, 9, 1),
-             np.array(1 - state[:, :, :, -1]).reshape(1, 9, 9, 1)],
-            axis=3)
-        return new_state, 0
-
-
-pure_test = [
-    0, 1, 0, 1, 0, 1, 0, 0, 0,
-    1, 0, 1, 0, 1, 0, 0, 0, 0,
-    0, 1, 0, 1, 0, 0, 1, 0, 0,
-    0, 0, 1, 0, 0, 1, 0, 1, 0,
-    0, 0, 0, 0, 0, 1, 1, 1, 0,
-    1, 1, 1, 0, 0, 0, 0, 0, 0,
-    1, 0, 1, 0, 0, 1, 1, 0, 0,
-    1, 1, 1, 0, 1, 0, 1, 0, 0,
-    0, 0, 0, 0, 1, 1, 1, 0, 0
-]
-
-pt_qry = [(1, 1), (1, 5), (3, 3), (4, 7), (7, 2), (8, 6)]
-pt_ans = [True, True, True, True, True, True]
-
-opponent_test = [
-    0, 1, 0, 1, 0, 1, 0,-1, 1,
-    1,-1, 0,-1, 1,-1, 0, 1, 0,
-    0, 0, 0, 0, 0, 0, 0, 0, 1,
-    1, 1,-1, 0, 1,-1, 1, 0, 0,
-    1, 0, 1, 0, 1, 0, 1, 0, 0,
-   -1, 1, 1, 0, 1, 1, 1, 0, 0,
-    0, 1,-1, 0,-1,-1,-1, 0, 0,
-    1, 0, 1, 0,-1, 0,-1, 0, 0,
-    0, 1, 0, 0,-1,-1,-1, 0, 0
-]
-ot_qry = [(1, 1), (1, 5), (2, 9), (5, 2), (5, 6), (8, 2), (8, 6)]
-ot_ans = [False, False, False, False, False, True, False]
-
-#print (ge._find_group((6, 1)))
-#print ge._is_eye(utils.BLACK, pt_qry[0])
-ge = GoEnv()
-ge._set_board(pure_test)
-for i in range(6):
-    print (ge._is_eye(utils.BLACK, pt_qry[i]))
-ge._set_board(opponent_test)
-for i in range(7):
-    print (ge._is_eye(utils.BLACK, ot_qry[i]))