In [43]:
%matplotlib notebook

import matplotlib.pyplot as plt
import datetime
from __future__ import division
from random import choice
from math import log, sqrt

In [10]:
plt.axes()

circle = plt.Circle((0, 0), radius=0.75, fc='y')
plt.gca().add_patch(circle)

plt.axis('scaled')
plt.show()

<IPython.core.display.Javascript object>

In [258]:
class Board(object):
    def __init__(self, n, m, d, Rs, Rc, O):
        self.n = n
        self.m = m
        self.d = d
        self.Rs = Rs
        self.Rc = Rc
        self.O = O
        O2 = []
        for x1, y1, x2, y2 in O:
            for x in range(x1, x2+1):
                for y in range(y1, y2+1):
                    O2.append((x, y))
        self.O2 = O2
        self.O2set = set(O2)
    
    def start(self):
        # Returns a representation of the starting state of the game.
        return [(-1,-1)] * self.m

    def next_state(self, state, play):
        # Takes the game state, and the move to be applied.
        # Returns the new game state.
        try:
            t = next(i for i,p in enumerate(state) if p[0] < 0 or p[1] < 0)
        except StopIteration:
            return state
        state_copy = state[:]
        state_copy[t] = play
        return state_copy

    def legal_plays(self, state_history):
        # Takes a sequence of game states representing the full
        # game history, and returns the full list of moves that
        # are legal plays for the current player.
        state = state_history[-1]
        legal = []
#         try:
#             t = next(i for i,p in enumerate(state) if p[0] < 0 or p[1] < 0)
#         except StopIteration:
#             return []
        n = self.n
        m = self.m
        Rs = self.Rs
        Rc = self.Rc
        t = -1
        for i in range(m):
            try:
                x, y = state[i]
            except TypeError:
                return []
            if x < 0 or y < 0:
                t = i
                break
        if t == -1:
            return []
        if t == 0:
            # First iteration anywhere but inside obstacles
            for j in range(0, n+1):
                for k in range(0, n+1):
                    if (j, k) not in self.O2set:
                        legal.append((j, k))
        else:
            # Loop through deployed positions
            for i in range(0, t):
                x, y = state[i]
                # Eliminate out of bound positions
                if x < 0 or y < 0 or x > n or y > n:
                    continue
                # Loop through possible deploy positions
                # (j, k) = possible position
                for j in range(x - Rc[i] - Rc[t] + 1, x + Rc[i] + Rc[t]):
                    for k in range(y - Rc[i] - Rc[t] + 1, y + Rc[i] + Rc[t]):
                        # Eliminate out of bound positions
                        if j < 0 or k < 0 or j > n or k > n:
                            continue
                        # Eliminate deployed positions
                        if (j, k) in state:
                            continue
                        # Eliminate inside obstacles
                        if (j, k) in self.O2:
                            continue
                        overlap = []
                        # Loop through possible coverage
                        # (u, v) = points in sensor i
                        # Need to determine if (u, v) is in coverage of sensor t deployed at (j,k)
                        for u in range(x - Rc[i], x + Rc[i] + 1):
                            for v in range(y - Rc[i], y + Rc[i] + 1):
                                # Eliminate out of bound
                                if u < 0 or v < 0 or u > n or v > n:
                                    continue
                                # Eliminate out of circle
                                if sqrt((u-x)*(u-x) + (v-y)*(v-y)) > Rc[i]:
                                    continue
                                # Determine if (u,v) is covered by sensor t
                                if sqrt((u-j)*(u-j) + (v-k)*(v-k)) <= Rc[t]:
                                    overlap.append((u, v))
                        if len(overlap) >= 2 and set(overlap).issubset(self.O2set) is False:
                            legal.append((j,k))
        return legal

    def winner(self, state_history):
        # Takes a sequence of game states representing the full
        # game history.  If the game is now won, return the player
        # number.  If the game is still ongoing, return zero.  If
        # the game is tied, return a different distinct value, e.g. -1.
        pass

In [247]:
class MonteCarlo(object):
    def __init__(self, board, **kwargs):
        # Takes an instance of a Board and optionally some keyword
        # arguments.  Initializes the list of game states and the
        # statistics tables.
        self.board = board
        self.states = []
        seconds = kwargs.get('time', 5)
        self.calculation_time = datetime.timedelta(seconds=seconds)
        self.max_moves = kwargs.get('max_moves', 100)
        self.C = kwargs.get('C', 1.4)
        self.scores = {}
        self.plays = {}
        pass

    def update(self, state):
        # Takes a game state, and appends it to the history.
        self.states.append(state)
        pass

    def get_play(self):
        # Causes the AI to calculate the best move from the
        # current game state and return it.
        self.max_depth = 0
        state = self.states[-1]
        legal = self.board.legal_plays(self.states[:])

        # Bail out early if there is no real choice to be made.
        if not legal:
            return
        if len(legal) == 1:
            return legal[0]

        games = 0
        begin = datetime.datetime.utcnow()
        while datetime.datetime.utcnow() - begin < self.calculation_time:
            self.run_simulation()
            games += 1

        moves_states = [(p, self.board.next_state(state, p)) for p in legal]

        # Display the number of calls of `run_simulation` and the
        # time elapsed.
        print(games, datetime.datetime.utcnow() - begin)

        # Pick the move with the highest score.
        percent_scores, move = max(
            (self.scores.get(tuple(S), 0) /
             self.plays.get(tuple(S), 1),
             p)
            for p, S in moves_states
        )

        # Display the stats for each possible play.
        for x in sorted(
            ((self.scores.get(tuple(S), 0) /
              self.plays.get(tuple(S), 1),
              self.scores.get(tuple(S), 0),
              self.plays.get(tuple(S), 0), p)
             for p, S in moves_states),
            reverse=True
        ):
            print ("{3}: {0:.2f} ({1} / {2})".format(*x))

        print ("Maximum depth searched:", self.max_depth)

        return move

    def run_simulation(self):
        # Plays out a "random" game from the current position,
        # then updates the statistics tables with the result.
        
        # A bit of an optimization here, so we have a local
        # variable lookup instead of an attribute access each loop.
        plays, scores = self.plays, self.scores

        visited_states = set()
        states_copy = self.states[:]
        state = states_copy[-1]

        expand = True
        for t in range(1, self.max_moves + 1):
            legal = self.board.legal_plays(states_copy)
            
            moves_states = [(p, self.board.next_state(state, p)) for p in legal]
            
            if not moves_states:
                continue

            if plays.get(tuple(state)) and plays[tuple(state)] >= 10 and all(plays.get(tuple(S)) for p, S in moves_states):
                # If we have stats on all of the legal moves here, use them.
                log_total = log(
                    sum(plays[tuple(S)] for p, S in moves_states)
                )
                value, move, state = max(
                    ((scores[tuple(S)] / plays[tuple(S)]) +
                     self.C * sqrt(log_total / plays[tuple(S)]), p, S)
                    for p, S in moves_states
                )
            else:
                # Otherwise, just make an arbitrary decision.
                move, state = choice(moves_states)

            states_copy.append(state)

            if expand and tuple(state) not in plays:
                expand = False
                plays[tuple(state)] = 0
                scores[tuple(state)] = 0
                if t > self.max_depth:
                    self.max_depth = t

            visited_states.add(tuple(state))

#             winner = self.board.winner(states_copy)
#             if winner:
#                 break

        for state in visited_states:
            if tuple(state) not in plays:
                continue
            plays[tuple(state)] += 1
            cov = 0
            for x in range(self.board.n+1):
                for y in range(self.board.n+1):
                    for i in range(self.board.m):
                        j, k = state[i]
                        if sqrt((x-j)*(x-j) + (y-k)*(y-k)) <= self.board.Rs[i]:
                            cov += 1
                            break
            scores[tuple(state)] += cov

In [175]:
n = 5
m = 4
d = 3
Rs = (1,1,1,2)
Rc = (2,2,2,3)
O = [(0,0,1,1),(3,3,5,5),(6,4,7,7)]
board = Board(n, m, d, Rs, Rc, O)
history = [[] for i in range(m+1)]
history[0] = [board.start()]
for i in range(0, m):
    for state in history[i]:
        legal_plays = board.legal_plays([state])
        if not legal_plays:
            continue
        for play in legal_plays:
            history[i+1].append(board.next_state(state, play))

possibles = history[-1]

count = len(possibles)
worst = 1
for i in range(0, m):
    worst *= (n+1)*(n+1) - len(board.O2) - i

print(count, worst, count/worst)

max_cov = 0
max_deploy = None
for deploy in possibles:
    cov = 0
    for x in range(n+1):
        for y in range(n+1):
            for i in range(m):
                j, k = deploy[i]
                if sqrt((x-j)*(x-j) + (y-k)*(y-k)) <= Rs[i]:
                    cov += 1
                    break
    if cov > max_cov:
        max_deploy = deploy[:]
        max_cov = cov

plt.clf()
plt.axes()

for i in range(0, m):
    x, y = max_deploy[i]
    circle = plt.Circle((x, y), radius=Rs[i], fc='r', alpha=0.3)
    plt.gca().add_patch(circle)
    circle = plt.Circle((x, y), radius=Rc[i], fc='y', alpha=0.3)
    plt.gca().add_patch(circle)
    circle = plt.Circle((x, y), radius=0.1, fc='r', alpha=1)
    plt.gca().add_patch(circle)

for j in range(0, d):
    x1, y1, x2, y2 = O[j]
    rect = plt.Rectangle((x1, y1), x2 - x1, y2 - y1)
    plt.gca().add_patch(rect)
    
for i in range(0, m):
    x, y = max_deploy[i]
    circle = plt.Circle((x, y), radius=0.1, fc='r', alpha=1)
    plt.gca().add_patch(circle)

plt.axis('scaled')
plt.grid(color='black', linestyle='-', alpha=0.5, linewidth=1)
plt.show()

417120 32760 12.732600732600732


<IPython.core.display.Javascript object>

In [266]:
n = 10
m = 6
d = 3
Rs = (1,1,1,2,2,2)
Rc = (2,2,2,3,3,4)
O = [(0,0,1,1),(3,3,5,5),(6,4,7,7)]
board = Board(n, m, d, Rs, Rc, O)
montecarlo = MonteCarlo(board)
montecarlo.update(board.start())
for i in range(0, m):
    move = montecarlo.get_play()
    print('This is move', move)
    montecarlo.update(board.next_state(montecarlo.states[-1], move))

max_deploy = montecarlo.states[-1]
print(max_deploy)

plt.clf()
plt.axes()

for i in range(0, m):
    x, y = max_deploy[i]
    circle = plt.Circle((x, y), radius=Rs[i], fc='r', alpha=0.3)
    plt.gca().add_patch(circle)
    circle = plt.Circle((x, y), radius=Rc[i], fc='y', alpha=0.3)
    plt.gca().add_patch(circle)
    circle = plt.Circle((x, y), radius=0.1, fc='r', alpha=1)
    plt.gca().add_patch(circle)

for j in range(0, d):
    x1, y1, x2, y2 = O[j]
    rect = plt.Rectangle((x1, y1), x2 - x1, y2 - y1)
    plt.gca().add_patch(rect)
    
for i in range(0, m):
    x, y = max_deploy[i]
    circle = plt.Circle((x, y), radius=0.1, fc='r', alpha=1)
    plt.gca().add_patch(circle)

plt.axis('scaled')
plt.grid(color='black', linestyle='-', alpha=0.5, linewidth=1)
plt.show()

348 0:00:05.008558
(1, 2): 6.00 (42 / 7)
(9, 6): 6.00 (36 / 6)
(8, 4): 6.00 (36 / 6)
(4, 9): 6.00 (36 / 6)
(3, 1): 6.00 (36 / 6)
(2, 5): 6.00 (36 / 6)
(1, 9): 6.00 (36 / 6)
(9, 9): 6.00 (30 / 5)
(8, 8): 6.00 (30 / 5)
(8, 7): 6.00 (30 / 5)
(8, 6): 6.00 (30 / 5)
(5, 7): 6.00 (30 / 5)
(2, 4): 6.00 (30 / 5)
(9, 7): 6.00 (24 / 4)
(9, 4): 6.00 (24 / 4)
(8, 2): 6.00 (24 / 4)
(8, 1): 6.00 (24 / 4)
(7, 9): 6.00 (24 / 4)
(5, 8): 6.00 (24 / 4)
(4, 7): 6.00 (24 / 4)
(4, 1): 6.00 (24 / 4)
(1, 8): 6.00 (24 / 4)
(9, 8): 6.00 (18 / 3)
(9, 5): 6.00 (18 / 3)
(9, 3): 6.00 (18 / 3)
(7, 8): 6.00 (18 / 3)
(7, 3): 6.00 (18 / 3)
(7, 2): 6.00 (18 / 3)
(5, 2): 6.00 (18 / 3)
(5, 1): 6.00 (18 / 3)
(4, 8): 6.00 (18 / 3)
(4, 6): 6.00 (18 / 3)
(3, 9): 6.00 (18 / 3)
(3, 7): 6.00 (18 / 3)
(3, 6): 6.00 (18 / 3)
(2, 7): 6.00 (18 / 3)
(2, 3): 6.00 (18 / 3)
(2, 2): 6.00 (18 / 3)
(1, 7): 6.00 (18 / 3)
(1, 6): 6.00 (18 / 3)
(1, 3): 6.00 (18 / 3)
(8, 5): 6.00 (12 / 2)
(8, 3): 6.00 (12 / 2)
(7, 1): 6.00 (12 / 2)
(6, 9): 6.00 

607 0:00:05.007554
(2, 5): 54.00 (378 / 7)
(2, 5): 54.00 (378 / 7)
(2, 4): 54.00 (378 / 7)
(2, 4): 54.00 (378 / 7)
(3, 6): 54.00 (216 / 4)
(3, 6): 54.00 (216 / 4)
(2, 7): 54.00 (54 / 1)
(1, 5): 53.00 (371 / 7)
(1, 5): 53.00 (371 / 7)
(2, 2): 53.00 (159 / 3)
(1, 6): 53.00 (159 / 3)
(2, 9): 53.00 (106 / 2)
(2, 8): 53.00 (106 / 2)
(2, 1): 53.00 (106 / 2)
(1, 8): 53.00 (106 / 2)
(1, 3): 53.00 (106 / 2)
(1, 2): 53.00 (106 / 2)
(1, 4): 53.00 (53 / 1)
(1, 9): 52.00 (260 / 5)
(3, 8): 52.00 (156 / 3)
(3, 2): 52.00 (156 / 3)
(3, 7): 52.00 (52 / 1)
(4, 6): 51.00 (459 / 9)
(4, 6): 51.00 (459 / 9)
(4, 6): 51.00 (459 / 9)
(3, 9): 51.00 (255 / 5)
(3, 1): 51.00 (102 / 2)
(5, 6): 50.00 (700 / 14)
(5, 6): 50.00 (700 / 14)
(5, 6): 50.00 (700 / 14)
(5, 6): 50.00 (700 / 14)
(5, 6): 50.00 (700 / 14)
(4, 7): 50.00 (350 / 7)
(4, 7): 50.00 (350 / 7)
(2, 0): 50.00 (300 / 6)
(2, 10): 50.00 (250 / 5)
(0, 6): 50.00 (200 / 4)
(0, 3): 50.00 (200 / 4)
(0, 8): 50.00 (150 / 3)
(0, 4): 50.00 (150 / 3)
(3, 10): 50.00 (10

In [195]:
a = {}
a[([1],)] =1

TypeError: unhashable type: 'list'