Минимаксный алгоритм Отелло / Реверси

Недавно я работал над алгоритмом MiniMax для стандартной игры 8x8 Othello (Reversi) на Android на Java. Кажется, что каждый журнал показывает правильные значения для каждого узла, и все же алгоритм почему-то просто не выбирает оптимальный ход (я сравнил поведение с чужим приложением, и в какой-то момент они различаются).

Боюсь, есть немного кода, который можно проглотить, но я верю, что вы можете сделать это!

Прежде всего, мой класс Algorithm (от этого класса я наследую алгоритм MiniMax):

public abstract class Algorithm 
{
/** game instance to which the strategy is applied */
Game game;

public Algorithm (Game game)
{
    this.game = game;
}

/**Finds player's all possible moves for the current state   * 
 * @param gb - a game board for which the moves are found
 * @param player - current player
 * @return - an array list of possible fields to move
 */
public ArrayList<Field> findAllPossibleMoves(GameBoard gb, boolean player)
{
    ArrayList <Field> moves = new ArrayList <Field> ();
    for (int y= 0; y<gb.getHeight();y++) for (int x= 0; x<gb.getWidth();x++)
    {
        Field f = new Field (x,y);
        if (game.isAvailable(gb, f, player)) moves.add(f);          
    }
    return moves;
}

/** Searches for the right move 
 * @param gb - game board to do the search on
 * @param depth maximum depth of search tree
 * @param player - current player
 * @return - optimum move (Field)
 */
public abstract Field findBestMove(GameBoard gb, int depth, boolean player);

/**Evaluates the player's current state  * 
 * @param gb - game board to be evaluated
 * @param player - player for which we evaluate
 * @return - the current rating (int)
 */ 
public int evaluate(GameBoard gb) 
{
    int rating = 0;     
    int[][] eval_table = {
            {99,  -8,  8,  6,  6,  8,  -8, 99},
            {-8, -24, -4, -3, -3, -4, -24, -8},
            { 8,  -4,  7,  4,  4,  7,  -4,  8},
            { 6,  -3,  4,  0,  0,  4,  -3,  6},
            { 6,  -3,  4,  0,  0,  4,  -3,  6},
            { 8,  -4,  7,  4,  4,  7,  -4,  8},
            {-8, -24, -4, -3, -3, -4, -24, -8},
            {99,  -8,  8,  6,  6,  8,  -8, 99}
    };
    for (int x=0; x<8; x++) for (int y=0;y<8;y++)
    {
        if(gb.board[x][y] == GameBoard.WHITE)
        {
            //rating+=eval_table[x][y];
            rating++;
        }
    }
    return rating;
}
}

Функция findBestMove, конечно, переопределяется в дочернем классе MiniMax:

@Override
public Field findBestMove(GameBoard gb, int depth, boolean player) 
{   
    /** maximum depth of search reached, we stop */
    if(depth >= max_depth) return null;

    //player = (depth+1)%2 + 1;

    /** getting a list of moves to chose from */
    ArrayList <Field> moves = findAllPossibleMoves(gb, player); 

    Field best_move = null;

    /** iterating over all possible moves, to find the best one */      
    for (int i=0; i<moves.size(); i++)
    {
        /** board to simulate moves */
        GameBoard temp_board = new GameBoard(gb);
        /** getting the current move */
        Field move = moves.get(i);      
        /** simulating the move for the current node */
        game.move(move, temp_board, player);
        Log.i("board", "Depth:"+depth+" Player:"+player+" Move:"+i+" Rating:"+evaluate(temp_board));
        Log.i("board", ""+moves.get(i).getX()+","+moves.get(i).getY());         
        temp_board.printBoard();
        /** getting to the next inferior node */            
        Field best_deep_move = findBestMove (temp_board, depth + 1, !player);           

        /** if the maximum depth is reached, we have a null, so we evaluate */
        if (best_deep_move == null) 
        {
            move.setRating(evaluate (temp_board));
        }
        /** if we are not the deepest possible, we get the rating from the lower node */
        else 
        {
            move.setRating(best_deep_move.getRating());         
            Log.i("eval", ""+best_deep_move.getRating());
        }           
        if(best_move == null) 
        {
            best_move = move;           
        }

        else
        {   
            Log.i("update", "Current move rating:"+move.getRating());
            Log.i("update", "New move rating:"+best_move.getRating());
            if (depth%2==0)
            {
                Log.i("update", "MAX player");
                /** for us, we look for the maximum */
                if (best_move.getRating() < move.getRating()) 
                    {


                    best_move = move;

                    }

            }
            else
            {
                Log.i("update", "MIN player");
                /** for the opponent, we look for the minimum */
                if (best_move.getRating() > move.getRating())
                { 


                    best_move = move;

                }
            }
            Log.i("update", "Updated move rating"+best_move.getRating());
        }
    }

    return best_move;
}

Алгоритм создан в моем текущем экземпляре Game:

public class Game {

public GameBoard game_board;
public Algorithm alg;

boolean active_player;
//int other_player;
int white_count;
int black_count;
int depth;

public Game()
{
    game_board = new GameBoard(8, 8);
    active_player = true;
    //other_player = GameBoard.WHITE;
    white_count = 0;
    black_count = 0;


    // AI strategy
    alg = new MiniMaxAlgorithm(this);
}


public boolean getActive_player() {
    return active_player;

}


public void setActive_player(boolean active_player) {
    this.active_player = active_player;
}

//public boolean getOther_player() {
    //return other_player;
//}


//public void setOther_player(boolean other_player) {
    //this.other_player = other_player;
//  }



public int getWhite_count() {
    return white_count;
}


public void setWhite_count(int white_count) {
    this.white_count = white_count;
}


public int getBlack_count() {
    return black_count;
}


public void setBlack_count(int black_count) {
    this.black_count = black_count;
}

// array of 8 possible directions
public final int[][] directions = new int [][]{
        {-1, 0},
        {-1, 1},
        {0, 1},
        {1, 1},
        {1, 0},
        {1, -1},
        {0, -1},
        {-1, -1}            
};


public int playerToPiece (boolean player)
{
    return player == true? GameBoard.BLACK : GameBoard.WHITE;
}

/** Function checking if a given field is available to move
 * 
 * @param f - field to be checked
 * @return - whether or not the field is available (boolean)
 */

public boolean isAvailable (GameBoard gb, Field f, boolean player)
{
    if(gb.board[f.x][f.y] != GameBoard.EMPTY) return false;
    /** iterating over all 8 possible directions */
    for (int k=0; k<directions.length; k++)
    {
        int dx = directions[k][0];
        int dy = directions[k][1];          
        /** scanning through all fields in line with the current direction */           
        for (int i = f.x + dx, j = f.y + dy; 
                i>=0 && i<gb.getWidth() && j>=0 && j<gb.getHeight() ; i+=dx, j+=dy)
        {
            if(i == f.x + dx && j == f.y + dy && gb.board[i][j] == playerToPiece(player)) break;
            if(gb.board[i][j] == GameBoard.EMPTY) break;
            else if(gb.board[i][j] == playerToPiece(player)) return true;
        }
    }
    return false;
}

/** Function performing a move
 * 
 * @param f - destination field of the move
 * @param board - board to do the move on
 * @param player - player that performs the move
 */

public void move (Field f, GameBoard board, boolean player)
{

    if (f == null) return;
    if (isAvailable(board, f, player))
    {
        board.board[f.x][f.y] = playerToPiece(player); 
        /** iterating over all 8 possible directions */
        for (int k=0;k < directions.length; k++)
        {
            int dx = directions[k][0];
            int dy = directions[k][1];
            /** scanning through all fields in line with the current direction */               
            for (int i = f.x + dx, j = f.y + dy; 
                    i>=0 && j>=0 && i<board.getWidth() && j<board.getHeight() ; i+=dx, j+=dy)
            {
                /** if there is an empty field, there can be no line, so we move on to the next dir */
                if(board.board[i][j] == GameBoard.EMPTY) break;
                /** if the field is the same as active, we fill all the fields up to that one with 
                 * that color  */
                else if(board.board[i][j] == playerToPiece(player))
                {
                    for (int a = f.x, b = f.y; a*dx<=i*dx && b*dy<=j*dy; a+=dx, b+=dy)
                    {
                        board.board[a][b] = playerToPiece(player);
                    }
                    break;
                }
            }
        }

        white_count = black_count = 0;
        for (int i = 0; i < board.getWidth(); i++)
        {
            for (int j=0; j < board.getHeight(); j++)
            {
                if (board.board[i][j] == GameBoard.WHITE) white_count++;
                else if (board.board[i][j] == GameBoard.BLACK) black_count++;
            }
        }
    }
}


/** Function changing the active player
 * 
 */
public void changePlayer ()
{
    active_player = !active_player;
    //active_player = active_player == GameBoard.BLACK ? GameBoard.WHITE : GameBoard.BLACK;
    //other_player = other_player == GameBoard.BLACK ? GameBoard.WHITE : GameBoard.BLACK;
}

}

Я действительно предпринял исследовательскую работу, но должен признать, что нелегко отследить и исправить ошибку с помощью повторяющейся функции, просто погуглив проблему. Это заставляет меня зацикливаться на дальнейшей оптимизации (альфа-бета и т. Д.), И мне действительно нужно ускориться сейчас.

0 ответов

Другие вопросы по тегам