In [6]:

import logging
from collections import namedtuple
import random
from copy import deepcopy
from itertools import accumulate
from operator import xor


# A move: remove `num_objects` objects from the row with index `row`.
Nimply = namedtuple("Nimply", "row, num_objects")


class Nim:
    """Mutable board of a game of Nim.

    Row ``i`` starts with ``2 * i + 1`` objects. When ``k`` is not ``None`` it
    is the largest number of objects a single move may remove.
    """

    def __init__(self, num_rows: int, k: int = None):
        self._rows = [i * 2 + 1 for i in range(num_rows)]
        self._k = k

    def __bool__(self):
        """Return True while at least one object is left on the board."""
        return sum(self._rows) > 0

    def __str__(self):
        """Return the row sizes as ``<a b c>``."""
        return "<" + " ".join(str(_) for _ in self._rows) + ">"

    @property
    def rows(self) -> tuple:
        """Snapshot of the row sizes; mutating it does not affect the board."""
        return tuple(self._rows)

    @property
    def k(self):
        """Per-move removal cap, or ``None`` when moves are uncapped."""
        return self._k

    def nimming(self, ply: Nimply):
        """Apply ``ply`` by removing ``num_objects`` objects from row ``row``.

        The board is left untouched when the move is rejected.

        Raises:
            ValueError: if ``num_objects`` is smaller than 1, larger than the
                chosen row, or larger than the cap ``k``.
        """
        row, num_objects = ply
        # Explicit raises instead of asserts so the checks survive `python -O`.
        if num_objects < 1:
            # A zero move is a pass and a negative one would add objects.
            raise ValueError(
                f"a move must remove at least one object, got {num_objects}"
            )
        if num_objects > self._rows[row]:
            raise ValueError(
                f"cannot remove {num_objects} objects from row {row} "
                f"holding {self._rows[row]}"
            )
        if self._k is not None and num_objects > self._k:
            raise ValueError(
                f"cannot remove {num_objects} objects, the limit is {self._k}"
            )
        self._rows[row] -= num_objects

In [7]:
def dumb_PCI(state: Nim):
    """Return the move taking a single object from the first non-empty row.

    Raises:
        ValueError: if every row is empty, so no move exists.
    """
    # Scanning the rows is enough: the chosen move never depends on how many
    # objects the later rows hold, so there is no need to list every move.
    for row, count in enumerate(state.rows):
        if count > 0:
            return Nimply(row, 1)
    raise ValueError("no move available: every row is empty")

def pure_random(state: Nim):
    """Return a random move: a random non-empty row and a random amount.

    The amount is drawn from 1 up to the size of the chosen row, capped at
    ``state.k`` when a per-move limit is set.

    Raises:
        IndexError: if every row is empty (nothing to choose from).
    """
    rows = state.rows
    row = random.choice([r for r, c in enumerate(rows) if c > 0])
    # Honour the per-move cap, as the other strategies in this file do.
    most = rows[row] if state.k is None else min(rows[row], state.k)
    num_objects = random.randint(1, most)
    return Nimply(row, num_objects)

"""optimal strategy"""
def nim_sum(state: Nim):
    """Return the bitwise XOR of all row sizes of ``state``.

    A board without rows yields 0, the identity of XOR.
    """
    total = 0
    for count in state.rows:
        total ^= count
    return total

def cook_status(state: Nim):
    """Gather summary facts about ``state`` into a dictionary.

    Keys of the returned dict:
        possible_moves: every ``(row, amount)`` pair allowed by the row sizes
            and by ``state.k`` when it is set.
        active_rows_number: how many rows still hold objects.
        shortest_row: index of the smallest non-empty row.
        longest_row: index of the largest row.
        nim_sum: nim-sum of the current board.
        brute_force: ``(move, nim_sum_after_move)`` for every possible move.
    """
    rows = state.rows
    limit = state.k

    moves = []
    for row, count in enumerate(rows):
        for take in range(1, count + 1):
            if limit is None or take <= limit:
                moves.append((row, take))

    active = len([count for count in rows if count > 0])
    # min/max return the first extreme they meet, so ties go to the lower index.
    shortest = min(
        (row for row, count in enumerate(rows) if count > 0),
        key=lambda row: rows[row],
    )
    longest = max(range(len(rows)), key=lambda row: rows[row])
    current_sum = nim_sum(state)

    def nim_sum_after(move):
        # Play the move on a copy so the caller's board is left untouched.
        trial = deepcopy(state)
        trial.nimming(move)
        return nim_sum(trial)

    outcomes = [(move, nim_sum_after(move)) for move in moves]

    return {
        "possible_moves": moves,
        "active_rows_number": active,
        "shortest_row": shortest,
        "longest_row": longest,
        "nim_sum": current_sum,
        "brute_force": outcomes,
    }

def optimal_startegy(state: Nim):
    """Return a move leaving a nim-sum of 0, or a random move if none does."""
    outcomes = cook_status(state)["brute_force"]
    # The fallback is drawn up front, whether or not it ends up being used.
    fallback = random.choice(outcomes)
    for outcome in outcomes:
        move, resulting_sum = outcome
        if resulting_sum == 0:
            return move
    return fallback[0]

In [8]:
def eval_terminal(state: Nim):
    """Return -1 when ``state`` is falsy (no objects left), otherwise 0."""
    return 0 if state else -1

In [9]:
def minmax(state: Nim, step: int):
    """Search the game tree from ``state`` and return ``(move, value)``.

    ``value`` is seen from the side about to move: ``eval_terminal`` scores a
    finished board, and the value of each reply is negated on the way up.
    ``move`` is ``None`` when the board is terminal or no move is allowed.
    ``step`` is incremented and handed to the recursive calls; it does not
    influence the result.
    """
    outcome = eval_terminal(state)
    if outcome != 0:
        return None, outcome

    limit = state.k
    legal_moves = []
    for row, count in enumerate(state.rows):
        for take in range(1, count + 1):
            if limit is None or take <= limit:
                legal_moves.append((row, take))
    if not legal_moves:
        return None, outcome

    next_step = step + 1
    scored = []
    for move in legal_moves:
        child = deepcopy(state)
        child.nimming(move)
        reply_value = minmax(child, next_step)[1]
        score = -reply_value
        scored.append((move, score))
        if score == 1:
            # A winning move has been found; the remaining ones cannot beat it.
            break

    return max(scored, key=lambda entry: entry[1])

In [13]:
logging.getLogger().setLevel(logging.DEBUG)

# Play one match on a three-row board: player 0 uses the minmax search,
# player 1 uses the nim-sum strategy.
nim = Nim(3)

logging.debug(f"status: Initial board  -> {nim}")
player = 0
while nim:
    ply = minmax(nim, 0)[0] if player == 0 else optimal_startegy(nim)

    print(ply)
    nim.nimming(ply)
    logging.debug(f"status: After player {player} -> {nim}")
    player = 1 - player
# `player` was switched after the last move, so switch back to get the winner.
winner = 1 - player
logging.info(f"status: Player {winner} won!")

DEBUG:root:status: Initial board  -> <1 3 5>
DEBUG:root:status: After player 0 -> <1 3 2>
DEBUG:root:status: After player 1 -> <1 3 0>
DEBUG:root:status: After player 0 -> <1 1 0>
DEBUG:root:status: After player 1 -> <1 0 0>
DEBUG:root:status: After player 0 -> <0 0 0>
INFO:root:status: Player 0 won!


(2, 3)
(2, 2)
(1, 2)
(1, 1)
(0, 1)
