In [None]:
from random import random
from functools import reduce
from collections import namedtuple
from queue import PriorityQueue

import numpy as np

In [None]:
# --- Problem configuration -------------------------------------------------
PROBLEM_SIZE = 500   # number of elements that must be covered
NUM_SETS = 10_000    # number of candidate sets to choose from
SET_DENSITY = 0.3    # probability that a given element belongs to a given set
SEED = 42            # fixed seed so "Restart & Run All" rebuilds the same instance

# A dedicated, seeded generator keeps the instance reproducible and lets NumPy
# draw each membership mask in one vectorised call.
rng = np.random.default_rng(SEED)

# SETS[i] is a boolean mask of length PROBLEM_SIZE; True marks the elements
# contained in the i-th candidate set.
SETS = tuple(rng.random(PROBLEM_SIZE) < SET_DENSITY for _ in range(NUM_SETS))

# Search state: `taken` and `not_taken` hold indices into SETS.
State = namedtuple('State', ['taken', 'not_taken'])

In [None]:
def goal_check(state):
    """Tell whether the sets selected in ``state`` cover every element.

    Args:
        state: A ``State`` whose ``taken`` field holds indices into ``SETS``.

    Returns:
        A truthy NumPy boolean when every one of the ``PROBLEM_SIZE``
        positions is True in at least one taken set, falsy otherwise.
    """
    # Start from "nothing covered" and OR in each selected mask in turn.
    covered = np.array([False] * PROBLEM_SIZE)
    for index in state.taken:
        covered = np.logical_or(covered, SETS[index])
    return np.all(covered)

def distance(state):
    """Return how many elements are still uncovered by the taken sets.

    Args:
        state: A ``State`` whose ``taken`` field holds indices into ``SETS``.

    Returns:
        ``PROBLEM_SIZE`` minus the number of positions that are True in at
        least one taken set (so ``PROBLEM_SIZE`` when nothing is taken and
        0 when the state is a full cover).
    """
    covered = reduce(
        np.logical_or,
        [SETS[i] for i in state.taken],
        np.zeros(PROBLEM_SIZE, dtype=bool),
    )
    # Count inside NumPy: the builtin sum() would iterate the array element by
    # element in Python, and this function runs once per candidate state.
    return PROBLEM_SIZE - np.count_nonzero(covered)

def weigth(state):
    """Priority of ``state`` in the search frontier (lower is better).

    The value is the number of still-uncovered elements, as reported by
    ``distance``, plus the number of sets already taken.
    """
    uncovered = distance(state)
    sets_used = len(state.taken)
    return uncovered + sets_used

In [None]:
# Sanity check: if even the union of all candidate sets misses an element,
# no selection can ever reach the goal.
assert goal_check(State(taken=set(range(NUM_SETS)), not_taken=set())), "Problem not solvable"

In [None]:
# Best-first search: repeatedly expand the frontier state with the lowest
# weigth() until a state covering every element is popped.
frontier = PriorityQueue()
state = State(set(), set(range(NUM_SETS)))

# Queue entries are (priority, insertion_order, state). The insertion counter
# breaks ties between equal priorities, so the queue never falls back to
# comparing State tuples (set "<" is a subset test, not a total order) and
# equal-priority states are served first-in, first-out.
tie_breaker = 0
frontier.put((weigth(state), tie_breaker, state))

counter = 0  # number of states expanded so far
current_state = frontier.get()[-1]
while not goal_check(current_state):
    counter += 1
    # Each successor moves exactly one set index from not_taken to taken.
    for action in current_state.not_taken:
        new_state = State(
            current_state.taken | {action},
            current_state.not_taken - {action},
        )
        tie_breaker += 1
        frontier.put((weigth(new_state), tie_breaker, new_state))
    # PriorityQueue.get() blocks forever on an empty queue; fail loudly instead.
    if frontier.empty():
        raise RuntimeError("Frontier exhausted without reaching a goal state")
    current_state = frontier.get()[-1]

print(
    f"Solved in {counter:,} steps ({len(current_state.taken)} tiles)"
)

In [None]:
# Display the indices (into SETS) of the sets selected by the search.
current_state.taken

In [None]:
# Inspect the first candidate set: a boolean membership mask over the elements.
SETS[0]