Source code for gomoku

import numpy as np
from mcts import State
from numba import jit
from numba import int8

__version__ = "1.0.0"
__author__ = "Przemysław Klęsk"
__email__ = "pklesk@zut.edu.pl" 


[docs]
class Gomoku(State):
    """
    Class for states of Gomoku game.
    
    Attributes:
        M (int): 
            number of rows in the board, defaults to ``15``.            
        N (int): 
            number of columns in the board, defaults to ``15``.
        SYMBOLS (List):
            list of strings representing stone symbols (black, white) or ``"."`` for empty cell. 
    """        
    
    M = 15
    N = 15
    SYMBOLS = ["\u25CB", "+", "\u25CF"] # or: [['O', '+', 'X']
    

[docs]
    def __init__(self, parent=None):
        super().__init__(parent)
        if self.parent:
            self.board = np.copy(self.parent.board)
        else:
            self.board = np.zeros((Gomoku.M, Gomoku.N), dtype=np.int8)

    

[docs]
    @staticmethod
    def class_repr():
        """        
        Returns a string representation of class ``Gomoku`` (meant to instantiate states of Gomoku game), informing about the size of board.
        
        Returns:
            str: string representation of class ``Gomoku`` (meant to instantiate states of Gomoku game), informing about the size of board. 
        """        
        return f"{Gomoku.__name__}_{Gomoku.M}x{Gomoku.N}"    

            

[docs]
    def __str__(self):
        """        
        Returns a string representation of this ``Gomoku`` state - the contents of its game board.
        
        Returns:
            str: string representation of this ``Gomoku`` state - the contents of its game board.
        """                
        s = "  "
        for j in range(Gomoku.N):
            s += f"{chr(j + ord('A'))}"
        s += "\n"
        for i in range(Gomoku.M, 0, -1):
            s += str(i).rjust(2)
            for j in range(Gomoku.N):
                s += Gomoku.SYMBOLS[self.board[i - 1, j] + 1]
            s += str(i).ljust(2)
            s += "\n"
        s += "  "
        for j in range(Gomoku.N):
            s += f"{chr(j + ord('A'))}"
        return s         

    

[docs]
    def take_action_job(self, action_index):
        """
        Places a stone onto the crossing of the board indicated by the action_index (row: ``action_index // Gomoku.N``, column: ``action_index % Gomoku.N``) 
        and returns ``True`` if the action is legal (crossing was not occupied).
        Otherwise, does no changes and returns ``False``.

        Args:
            action_index (int): 
                index of crossing where to place a stone.
        
        Returns:
            action_legal (bool):
                boolean flag indicating if the specified action was legal and performed.
        """        
        i = action_index // Gomoku.N
        j = action_index % Gomoku.N
        if i < 0 or i >= Gomoku.M or j < 0 or j >= Gomoku.N:
            return False
        if self.board[i, j] != 0:
            return False
        self.board[i, j] = self.turn
        self.turn *= -1
        return True

    

[docs]
    def compute_outcome_job(self):
        """        
        Computes and returns the game outcome for this state in compliance with rules of Gomoku game: 
        {-1, 1} denoting a win for the minimizing or maximizing player, respectively, if he connected exactly 5 his stones (6 or more do not count for a win); 
        0 denoting a tie, when the board is filled and no line of 5 exists; 
        ``None`` when the game is ongoing.
        
        Returns:
            outcome ({-1, 0, 1} or ``None``)
                game outcome for this state.
        """        
        i = self.last_action_index // Gomoku.N
        j = self.last_action_index % Gomoku.N
        if True: # a bit faster outcome via numba
            numba_outcome = Gomoku.compute_outcome_job_numba_jit(Gomoku.M, Gomoku.N, self.turn, i, j, self.board)
            if numba_outcome != 0:
                return numba_outcome 
        else:
            last_token = -self.turn        
            # N-S
            total = 0
            for k in range(1, 6):
                if i -  k < 0 or self.board[i - k, j] != last_token:
                    break
                total += 1
            for k in range(1, 6):
                if i + k >= Gomoku.M or self.board[i + k, j] != last_token:
                    break            
                total += 1
            if total == 4:
                return last_token                        
            # E-W
            total = 0
            for k in range(1, 6):
                if j + k >= Gomoku.N or self.board[i, j + k] != last_token:
                    break
                total += 1
            for k in range(1, 6):
                if j - k < 0 or self.board[i, j - k] != last_token:
                    break            
                total += 1
            if total == 4:
                return last_token            
            # NE-SW
            total = 0
            for k in range(1, 6):
                if i - k < 0 or j + k >= Gomoku.N or self.board[i - k, j + k] != last_token:
                    break
                total += 1
            for k in range(1, 6):
                if i + k >= Gomoku.M or j - k < 0 or self.board[i + k, j - k] != last_token:
                    break
                total += 1            
            if total == 4:
                return last_token            
            # NW-SE
            total = 0
            for k in range(1, 6):
                if i - k < 0 or j - k < 0 or self.board[i - k, j - k] != last_token:
                    break
                total += 1
            for k in range(1, 6):
                if i + k >= Gomoku.M or j + k >= Gomoku.N or self.board[i + k, j + k] != last_token:
                    break
                total += 1            
            if total == 4:
                return last_token                                    
        if np.sum(self.board == 0) == 0: # draw
            return 0
        return None        



[docs]
    @staticmethod
    @jit(int8(int8, int8, int8, int8, int8, int8[:, :]), nopython=True, cache=True)  
    def compute_outcome_job_numba_jit(M, N, turn, last_i, last_j, board):
        """Called by ``compute_outcome_job`` for faster outcomes."""
        last_token = -turn        
        i, j = last_i, last_j
        # N-S
        total = 0
        for k in range(1, 6):
            if i - k < 0 or board[i - k, j] != last_token:
                break
            total += 1
        for k in range(1, 6):
            if i + k >= M or board[i + k, j] != last_token:
                break            
            total += 1
        if total == 4:
            return last_token        
        # E-W
        total = 0
        for k in range(1, 6):
            if j + k >= N or board[i, j + k] != last_token:
                break
            total += 1
        for k in range(1, 6):
            if j - k < 0 or board[i, j - k] != last_token:
                break            
            total += 1
        if total == 4:
            return last_token
        # NE-SW
        total = 0
        for k in range(1, 6):
            if i - k < 0 or j + k >= N or board[i - k, j + k] != last_token:
                break
            total += 1
        for k in range(1, 6):
            if i + k >= M or j - k < 0 or board[i + k, j - k] != last_token:
                break
            total += 1            
        if total == 4:
            return last_token
        # NW-SE
        total = 0
        for k in range(1, 6):
            if i - k < 0 or j - k < 0 or board[i - k, j - k] != last_token:
                break
            total += 1
        for k in range(1, 6):
            if i + k >= M or j + k >= N or board[i + k, j + k] != last_token:
                break
            total += 1            
        if total == 4:
            return last_token        
        return 0        

                            

[docs]
    def take_random_action_playout(self):
        """        
        Picks a uniformly random action from actions available in this state and returns the result of calling ``take_action`` with the action index as argument.
        
        Returns:
            child (State): 
                result of ``take_action`` call for the random action.          
        """        
        indexes = np.where(np.ravel(self.board) == 0)[0]
        action_index = np.random.choice(indexes) 
        child = self.take_action(action_index)
        return child    

    

[docs]
    def get_board(self):
        """                
        Returns the board of this state (a two-dimensional array of bytes).
        
        Returns:
            board (ndarray[np.int8, ndim=2]):
                board of this state (a two-dimensional array of bytes).
        """        
        return self.board

    

[docs]
    def get_extra_info(self):
        return None

   

[docs]
    @staticmethod
    def action_name_to_index(action_name):
        """        
        Returns an action's index (numbering from 0) based on its name. E.g., name ``"B4"`` for 15 x 15 Gomoku maps to index ``18``.
        
        Args:
            action_name (str):
                name of an action.
        Returns:
            action_index (int):
                index corresponding to the given name.   
        """        
        letter = action_name.upper()[0]
        j = ord(letter) - ord('A')
        i = int(action_name[1:]) - 1
        return i * Gomoku.N + j



[docs]
    @staticmethod
    def action_index_to_name(action_index):
        """        
        Returns an action's name based on its index (numbering from 0). E.g., index ``18`` for 15 x 15 Gomoku maps to name ``"B4"``.
        
        Args:
            action_index (int):
                index of an action.
        Returns:
            action_name (str):
                name corresponding to the given index.          
        """        
        i = action_index // Gomoku.N
        j = action_index % Gomoku.N
        return f"{chr(ord('A') + j)}{i + 1}"

   

[docs]
    @staticmethod
    def get_board_shape():
        """
        Returns a tuple with shape of boards for Gomoku game.
        
        Returns:
            shape (tuple(int, int)):
                shape of boards related to states of this class.
        """        
        return (Gomoku.M, Gomoku.N)



[docs]
    @staticmethod
    def get_extra_info_memory():
        """        
        Returns amount of memory (in bytes) needed to memorize additional information associated with Gomoku states - currently 0 (no such information).
        
        Returns:
            extra_info_memory (int):
                number of bytes required to memorize additional information associated with Gomoku states.
        """        
        return 0



[docs]
    @staticmethod
    def get_max_actions():
        """
        Returns the maximum number of actions (the largest branching factor) equal to the product: ``Gomoku.M * Gomoku.N``.
        
        Returns:
            max_actions (int):
                maximum number of actions (the largest branching factor) equal to the product: ``Gomoku.M * Gomoku.N``.
        """                        
        return Gomoku.M * Gomoku.N