In [5]:
"""
Tic Tac Toe Player using Minimax and Alpha-Beta Pruning
"""

import copy
import math
import random


X = "X"
O = "O"
EMPTY = None


def initial_state():
    """
    Returns starting state of the board.
    """
    return [[EMPTY, EMPTY, EMPTY],
            [EMPTY, EMPTY, EMPTY],
            [EMPTY, EMPTY, EMPTY]]


def player(board):
    """
    Returns player who has the next turn on a board.
    """
    count = 0
    for i in board:
        for j in i:
            if j:
                count += 1
    if count % 2 != 0:
        return O
    return X


def actions(board):
    """
    Returns set of all possible actions (i, j) available on the board.
    """
    res = set()
    board_len = len(board)
    for i in range(board_len):
        for j in range(board_len):
            if board[i][j] == EMPTY:
                res.add((i, j))
    return res


def result(board, action):
    """
    Returns the board that results from making move (i, j) on the board.
    """
    curr_player = player(board)
    result_board = copy.deepcopy(board)
    (i, j) = action
    result_board[i][j] = curr_player
    return result_board


def get_horizontal_winner(board):
    # check horizontally
    winner_val = None
    board_len = len(board)
    for i in range(board_len):
        winner_val = board[i][0]
        for j in range(board_len):
            if board[i][j] != winner_val:
                winner_val = None
        if winner_val:
            return winner_val
    return winner_val


def get_vertical_winner(board):
    # check vertically
    winner_val = None
    board_len = len(board)
    for i in range(board_len):
        winner_val = board[0][i]
        for j in range(board_len):
            if board[j][i] != winner_val:
                winner_val = None
        if winner_val:
            return winner_val
    return winner_val


def get_diagonal_winner(board):
    # check diagonally
    winner_val = None
    board_len = len(board)
    winner_val = board[0][0]
    for i in range(board_len):
        if board[i][i] != winner_val:
            winner_val = None
    if winner_val:
        return winner_val

    winner_val = board[0][board_len - 1]
    for i in range(board_len):
        j = board_len - 1 - i
        if board[i][j] != winner_val:
            winner_val = None

    return winner_val


def winner(board):
    """
    Returns the winner of the game, if there is one.
    """
    winner_val = get_horizontal_winner(board) or get_vertical_winner(board) or get_diagonal_winner(board) or None
    return winner_val


def terminal(board):
    """
    Returns True if game is over, False otherwise.
    """
    if winner(board) != None:
        return True

    for i in board:
        for j in i:
            if j == EMPTY:
                return False
    return True

def utility(board):
    """
    Returns 1 if X has won the game, -1 if O has won, 0 otherwise.
    """
    winner_val = winner(board)
    if winner_val == X:
        return 1
    elif winner_val == O:
        return -1
    return 0

# For Minimax without pruning
# def max_val(board):
#     # get max-value
#     if terminal(board):
#         return utility(board)
#     v = -math.inf
#     for action in actions(board):
#         v = max(v, min_val(result(board, action)))
#     return v


# def min_val(board):
#     # get min-value
#     if terminal(board):
#         return utility(board)
#     v = math.inf
#     for action in actions(board):
#         v = min(v, max_val(result(board, action)))
#     return v

# For Alpha Beta Pruning
def max_val(board,alpha,beta):
    # get max-value
    if terminal(board):
        return utility(board)
    v = -math.inf
    for action in actions(board):
        min_val_op = min_val(result(board, action),alpha,beta)
        # print(f"min_val_op {min_val_op} in action {action} with alpha {alpha} and beta {beta}")
        if alpha < beta:
            v = max(v, min_val_op)
            if alpha < v:
                alpha =v
    return v


def min_val(board,alpha,beta):
    # get min-value
    if terminal(board):
        return utility(board)
    v = math.inf
    for action in actions(board):
        max_val_op = max_val(result(board, action),alpha,beta)
        # print(f"max_val_op {max_val_op} in action {action} with alpha {alpha} and beta {beta}")
        if alpha < beta:
            v = min(v, max_val_op)
            if beta > v:
                beta = v
    return v


In [6]:
def minimax(board):
    """
    Returns the optimal action for the current player on the board.
    """
    
    if board == initial_state():
        return (random.randint(0, 2), random.randint(0, 2))
    curr_player = player(board)
    action_to_return = None
    if curr_player == X:
        val = -math.inf
        for action in actions(board):
            min_val_result = min_val(result(board, action))
            if val < min_val_result:
                val = min_val_result
                action_to_return = action
    elif curr_player == O:
        val = math.inf
        for action in actions(board):
            max_val_result = max_val(result(board, action))
            if val > max_val_result:
                val = max_val_result
                action_to_return = action
    return action_to_return

In [7]:
def alpha_beta_pruining(board):
    """
    Returns the optimal action for the current player on the board.
    """
    alpha = math.inf
    beta = -math.inf
    
    if board == initial_state():
        return (random.randint(0, 2), random.randint(0, 2))
    curr_player = player(board)
    action_to_return = None
    if curr_player == X:
        val = -math.inf
        for action in actions(board):
            if alpha >= beta:
                min_val_result = min_val(result(board, action),alpha,beta)
                if val < min_val_result:
                    val = min_val_result
                    action_to_return = action
                if val < beta:
                    beta = val
    elif curr_player == O:
        val = math.inf
        for action in actions(board):
            if alpha >= beta:
                max_val_result = max_val(result(board, action),alpha,beta)
                if val > max_val_result:
                    val = max_val_result
                    action_to_return = action
                if val > alpha:
                    alpha = val
    return action_to_return

In [8]:

if __name__ == "__main__":
    user = None
    board = initial_state()
    ai_turn = False
    print("Choose a player")
    user=input()
    while True:
        game_over =terminal(board)
        playr = player(board)
        if game_over:
            winner = winner(board)
            if winner is None:
                print("Game Over: Tie.")
            else:
                print(f"Game Over: {winner} wins.")
            break;
    
        else:
            
            if user != playr and not game_over:
                 if ai_turn:
                        # here we can select minimax or alpha_beta_pruining to play
                        move = alpha_beta_pruining(board)
                        board = result(board, move)
                        print(f'Move {move} and Board after AI move: {board}')
                        ai_turn = False
                        print(board)
            
             
            elif user == playr and not game_over:
            
                ai_turn = True
                print("Enter the position to move (row,col)")
                i=int(input("Row:"))
                j=int(input("Col:"))
                
                if board[i][j] == EMPTY:
                    board = result(board, (i, j))
                    print(board)
    

Choose a player
Enter the position to move (row,col)
[['X', None, None], [None, None, None], [None, None, None]]
Move (0, 1) and Board after AI move: [['X', 'O', None], [None, None, None], [None, None, None]]
[['X', 'O', None], [None, None, None], [None, None, None]]
Enter the position to move (row,col)
[['X', 'O', None], ['X', None, None], [None, None, None]]
Move (1, 2) and Board after AI move: [['X', 'O', None], ['X', None, 'O'], [None, None, None]]
[['X', 'O', None], ['X', None, 'O'], [None, None, None]]
Enter the position to move (row,col)
[['X', 'O', None], ['X', None, 'O'], ['X', None, None]]
Game Over: X wins.
