In [5]:
from queue import PriorityQueue
import numpy as np

class PuzzleNode:
    def __init__(self, state, parent=None, move=None, depth=0, cost=0):
        self.state = state
        self.parent = parent
        self.move = move
        self.depth = depth
        self.cost = cost
        self.mismatch = self.mismatch_count()
        self.total_cost = cost + self.mismatch  # Overall cost: path cost + mismatch count
    
    def __lt__(self, other):
        return self.total_cost < other.total_cost
    
    def mismatch_count(self):
        goal_state = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 0]])
        return np.sum(self.state != goal_state) - 1  # Exclude the blank tile
    
    def get_neighbors(self):
        neighbors = []
        x, y = np.where(self.state == 0)
        x, y = int(x), int(y)
        moves = {'Up': (x - 1, y), 'Down': (x + 1, y), 'Left': (x, y - 1), 'Right': (x, y + 1)}
        
        for move, (nx, ny) in moves.items():
            if 0 <= nx < 3 and 0 <= ny < 3:
                new_state = self.state.copy()
                new_state[x, y], new_state[nx, ny] = new_state[nx, ny], new_state[x, y]
                neighbors.append(PuzzleNode(new_state, self, move, self.depth + 1, self.depth + 1))
        
        return neighbors
    
    def path(self):
        node, path = self, []
        while node:
            path.append(node)
            node = node.parent
        return path[::-1]

def solve_puzzle(start_state):
    start_node = PuzzleNode(np.array(start_state))
    goal_state = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 0]])
    frontier = PriorityQueue()
    frontier.put(start_node)
    explored = set()
    
    while not frontier.empty():
        node = frontier.get()
        
        if np.array_equal(node.state, goal_state):
            return node.path()
        
        explored.add(tuple(map(tuple, node.state)))
        
        neighbors = node.get_neighbors()
        neighbors.sort(key=lambda n: n.total_cost)  # Sort by overall cost
        
        print(f"Choosing move with lowest total cost at depth {node.depth}:")
        for neighbor in neighbors:
            print(f"Move: {neighbor.move}, Cost: {neighbor.cost}, Mismatch: {neighbor.mismatch}, Total Cost: {neighbor.total_cost}")
            print("State after move:")
            print(neighbor.state)
            print()
        
        if neighbors:
            chosen_neighbor = neighbors[0]
            print("Chosen move with lowest total cost:")
            print(f"Move: {chosen_neighbor.move}, Cost: {chosen_neighbor.cost}, Mismatch: {chosen_neighbor.mismatch}, Total Cost: {chosen_neighbor.total_cost}")
            print("Chosen state:")
            print(chosen_neighbor.state)
            print()
        
        for neighbor in neighbors:
            if tuple(map(tuple, neighbor.state)) not in explored:
                frontier.put(neighbor)
    
    return None

# Example usage:
initial_state = [[1, 2, 3], [0, 4, 6], [7, 5, 8]]
solution = solve_puzzle(initial_state)

if solution:
    for step, node in enumerate(solution):
        print(f"Step {step}: Move {node.move}")
        print(f"Cost: {node.cost}, Mismatch: {max(node.mismatch,0)}, Total Cost: {node.total_cost}")
        print("State:")
        print(node.state)
        print()
else:
    print("No solution found.")


Choosing move with lowest total cost at depth 0:
Move: Right, Cost: 1, Mismatch: 2, Total Cost: 3
State after move:
[[1 2 3]
 [4 0 6]
 [7 5 8]]

Move: Up, Cost: 1, Mismatch: 4, Total Cost: 5
State after move:
[[0 2 3]
 [1 4 6]
 [7 5 8]]

Move: Down, Cost: 1, Mismatch: 4, Total Cost: 5
State after move:
[[1 2 3]
 [7 4 6]
 [0 5 8]]

Chosen move with lowest total cost:
Move: Right, Cost: 1, Mismatch: 2, Total Cost: 3
Chosen state:
[[1 2 3]
 [4 0 6]
 [7 5 8]]

Choosing move with lowest total cost at depth 1:
Move: Down, Cost: 2, Mismatch: 1, Total Cost: 3
State after move:
[[1 2 3]
 [4 5 6]
 [7 0 8]]

Move: Up, Cost: 2, Mismatch: 3, Total Cost: 5
State after move:
[[1 0 3]
 [4 2 6]
 [7 5 8]]

Move: Left, Cost: 2, Mismatch: 3, Total Cost: 5
State after move:
[[1 2 3]
 [0 4 6]
 [7 5 8]]

Move: Right, Cost: 2, Mismatch: 3, Total Cost: 5
State after move:
[[1 2 3]
 [4 6 0]
 [7 5 8]]

Chosen move with lowest total cost:
Move: Down, Cost: 2, Mismatch: 1, Total Cost: 3
Chosen state:
[[1 2 3]
 [4 

  x, y = int(x), int(y)
