In [1]:
from planning_inference.parsers import parse_model, parse_problem, parse_plan, parse_trajectory, parse_hypothesis, parse_observation_sequence
from planning_inference.generator import generate_trajectory
from planning_inference.functions import generate_all_literals, get_matching_literals

from planning_inference.pddl import Conjunction, Literal, Type, TypedObject, Effect, Truth, NumericConstant, PrimitiveNumericExpression, Increase
from planning_inference.pddl import SensorModel

from planning_inference.observations import Trajectory, Hypothesis, State

from planning_inference import DecodingTask

from sensor_models import load_sensor_model

import os
import copy
from collections import defaultdict
from itertools import combinations
from random import choice, choices, shuffle
from statistics import mean
import glob
import time

In [2]:
def launch_experiments(domain, task, timeout, observabilities=(30, 50, 70), failure_cost=1000):
    """Decode every hypothesis of every benchmark problem and record the results.

    For each observability level, problem directories are discovered with
    ``glob`` under ``benchmark/<domain>/<task>/<observability>/`` and processed
    in sorted order. For each problem the planning model is parsed from
    ``<problem>/domain``, the index of the correct hypothesis is read from
    ``<problem>/sol`` (only printed, not used further here), and one decoding
    task is solved per ``<problem>/hyp*`` file.

    Side effects, per problem directory:
      * ``plan.NN`` -- the decoded plan of hypothesis ``NN`` (zero-padded to
        two digits), written only when the returned plan has at least one action.
      * ``costs``   -- space-separated cost of every hypothesis.
      * ``times``   -- space-separated decoding duration (seconds) of every
        hypothesis.
    Progress is also printed to stdout.

    Args:
        domain: Benchmark domain name; also passed to ``load_sensor_model``.
        task: Benchmark task name (sub-directory of the domain).
        timeout: Value forwarded to ``decode`` as its ``t`` argument.
        observabilities: Observability levels (sub-directory names) to sweep.
            Defaults to the levels previously hard-coded in this function.
        failure_cost: Cost recorded when the returned plan has no actions.
            Defaults to the value previously hard-coded in this function.

    Returns:
        None.
    """
    # NOTE(review): parse_LTLHypothesis and DecodingTaskLTL are not imported in
    # the visible import cell (which imports parse_hypothesis and DecodingTask).
    # Confirm where they come from, otherwise this fails on a fresh kernel.
    Ms = load_sensor_model(domain)

    for observability in observabilities:
        base_path = "benchmark/%s/%s/%s/" % (domain, task, str(observability))

        for problem in sorted(glob.glob(base_path + "*")):
            costs = []
            times = []

            print(problem)

            # Planning Model
            Mp = parse_model(problem + "/domain")

            # Real Hypothesis
            with open(problem + "/sol", "r") as f:
                correct_h = int(f.read())

            print("Correct hypothesis: %d" % correct_h)

            # Hypotheses
            h_files = sorted(glob.glob(problem + "/hyp*"))

            for i, h_file in enumerate(h_files):
                h = parse_LTLHypothesis(h_file)

                # Build a decoding problem for each hypothesis
                T = DecodingTaskLTL(Mp, Ms, h)

                # perf_counter is monotonic, so the measured duration cannot be
                # distorted by system clock adjustments during a long run.
                tic = time.perf_counter()
                sol = T.decode(clean=True, planner="downward", t=timeout)
                toc = time.perf_counter()

                plan_length = len(sol.actions)
                if plan_length == 0:
                    # An empty plan is recorded with the sentinel failure cost
                    # and no plan file is written.
                    cost = failure_cost
                else:
                    cost = plan_length
                    sol.to_file(problem + "/plan.%s" % str(i).zfill(2))

                duration = toc - tic

                print("Hypothesis %d: %d, %.2f" % (i, cost, duration))

                costs.append(cost)
                times.append(duration)

            with open(problem + "/costs", "w") as f:
                f.write(" ".join(map(str, costs)))

            with open(problem + "/times", "w") as f:
                f.write(" ".join(map(str, times)))
    

In [3]:
# Shared settings for every experiment run in the cells below.
timeout = 120         # forwarded to launch_experiments as its timeout argument
domain = "floortile"  # benchmark domain to evaluate

In [4]:
# Run the benchmark sweep for the "monitoring" task of the configured domain.
task = "monitoring"
launch_experiments(domain=domain, task=task, timeout=timeout)

benchmark/floortile/monitoring/30/P00
Correct hypothesis: 2
Hypothesis 0: 1000, 2.81
Hypothesis 1: 1000, 2.19
Hypothesis 2: 16, 2.35
Hypothesis 3: 18, 2.64
Hypothesis 4: 1000, 2.17
Hypothesis 5: 1000, 2.21
benchmark/floortile/monitoring/30/P01
Correct hypothesis: 2
Hypothesis 0: 16, 2.31
Hypothesis 1: 1000, 2.25
Hypothesis 2: 16, 2.25
Hypothesis 3: 14, 2.05
Hypothesis 4: 15, 2.15
Hypothesis 5: 15, 2.19
benchmark/floortile/monitoring/30/P02
Correct hypothesis: 5
Hypothesis 0: 1000, 121.33
Hypothesis 1: 1000, 2.22
Hypothesis 2: 1000, 2.23
Hypothesis 3: 1000, 2.21
Hypothesis 4: 1000, 121.33
Hypothesis 5: 18, 2.35
benchmark/floortile/monitoring/30/P03
Correct hypothesis: 0
Hypothesis 0: 19, 2.87
Hypothesis 1: 1000, 2.24
Hypothesis 2: 1000, 2.20
Hypothesis 3: 1000, 2.24
Hypothesis 4: 17, 2.40
Hypothesis 5: 1000, 2.20
benchmark/floortile/monitoring/30/P04
Correct hypothesis: 3
Hypothesis 0: 17, 2.26
Hypothesis 1: 17, 2.29
Hypothesis 2: 18, 2.39
Hypothesis 3: 18, 2.50
Hypothesis 4: 1000, 2.26

In [5]:
# Run the benchmark sweep for the "prediction" task of the configured domain.
task = "prediction"
launch_experiments(domain=domain, task=task, timeout=timeout)

benchmark/floortile/prediction/30/P00
Correct hypothesis: 4
Hypothesis 0: 1000, 120.36
Hypothesis 1: 1000, 153.85
Hypothesis 2: 1000, 120.37
Hypothesis 3: 1000, 120.37
Hypothesis 4: 32, 38.15
Hypothesis 5: 1000, 120.37
benchmark/floortile/prediction/30/P01
Correct hypothesis: 4
Hypothesis 0: 1000, 154.22
Hypothesis 1: 1000, 120.52
Hypothesis 2: 1000, 154.23
Hypothesis 3: 1000, 120.45
Hypothesis 4: 32, 39.67
Hypothesis 5: 32, 37.45
benchmark/floortile/prediction/30/P02
Correct hypothesis: 0
Hypothesis 0: 34, 58.99
Hypothesis 1: 1000, 120.46
Hypothesis 2: 34, 60.17
Hypothesis 3: 34, 58.90
Hypothesis 4: 1000, 120.47
Hypothesis 5: 34, 59.32
benchmark/floortile/prediction/30/P03
Correct hypothesis: 4
Hypothesis 0: 1000, 120.41
Hypothesis 1: 1000, 120.39
Hypothesis 2: 35, 83.85
Hypothesis 3: 1000, 120.40
Hypothesis 4: 35, 99.52
Hypothesis 5: 1000, 120.39
benchmark/floortile/prediction/30/P04
Correct hypothesis: 4
Hypothesis 0: 1000, 120.48
Hypothesis 1: 1000, 120.46
Hypothesis 2: 1000, 120.4

In [6]:
# Run the benchmark sweep for the "hindsight" task of the configured domain.
task = "hindsight"
launch_experiments(domain=domain, task=task, timeout=timeout)

benchmark/floortile/hindsight/30/P00
Correct hypothesis: 0
Hypothesis 0: 24, 4.19
Hypothesis 1: 25, 6.01
Hypothesis 2: 25, 6.07
Hypothesis 3: 25, 40.33
Hypothesis 4: 24, 4.13
Hypothesis 5: 24, 38.17
benchmark/floortile/hindsight/30/P01
Correct hypothesis: 2
Hypothesis 0: 31, 52.53
Hypothesis 1: 31, 49.16
Hypothesis 2: 31, 52.25
Hypothesis 3: 31, 49.79
Hypothesis 4: 31, 53.73
Hypothesis 5: 31, 53.32
benchmark/floortile/hindsight/30/P02
Correct hypothesis: 3
Hypothesis 0: 1000, 120.45
Hypothesis 1: 1000, 120.45
Hypothesis 2: 1000, 120.45
Hypothesis 3: 1000, 120.45
Hypothesis 4: 1000, 120.45
Hypothesis 5: 1000, 120.46
benchmark/floortile/hindsight/30/P03
Correct hypothesis: 0
Hypothesis 0: 30, 24.25
Hypothesis 1: 30, 24.29
Hypothesis 2: 30, 24.93
Hypothesis 3: 30, 24.35
Hypothesis 4: 30, 24.15
Hypothesis 5: 30, 24.35
benchmark/floortile/hindsight/30/P04
Correct hypothesis: 5
Hypothesis 0: 35, 92.69
Hypothesis 1: 34, 83.79
Hypothesis 2: 34, 92.51
Hypothesis 3: 34, 66.85
Hypothesis 4: 34, 6