In [1]:
using Interact
using HDF5
using JLD
using PGFPlots

In [None]:
# debug visualization

In [None]:
# Load the debug dataset. The file is plain HDF5 with its arrays stored under
# the "risk" group, so it is read with HDF5 (already imported) rather than
# through JLD; the do-block closes the file handle as soon as the reads finish.
input_filepath = "../../data/datasets/11_27/risk_15.h5"
features, targets = h5open(input_filepath, "r") do file
    (read(file["risk/features"]), read(file["risk/targets"]))
end
# Samples are counted along the second dimension.
num_samples = size(features, 2)
# Flatten both arrays to vectors of length num_samples; reshape throws if an
# array holds a different number of elements.
features = reshape(features, num_samples)
targets = reshape(targets, num_samples);

In [None]:
# Scatter `features` against `targets` on a single wide axis and keep the
# resulting axis in `a` so the notebook displays it.
a = let points = Plots.Scatter(features, targets, markSize = 3)
    Axis(points;
        title = "Distance vs Collision Probability",
        xlabel = "Distance (m) from Car",
        ylabel = "Pr(Collision)",
        width = "24cm",
        height = "8cm")
end

In [None]:
# risk dataset analysis

In [None]:
# Load the risk dataset from its JLD file.
input_filepath = "../../data/datasets/risk.jld"
data = JLD.load(input_filepath)
features = data["features"]
targets = data["targets"]
# Rows of `features` are features, columns are samples.
num_features, num_samples = size(features);

In [None]:
# Interactive view: pick a feature row `f` and scatter it against the first
# row of `targets`, labelled Pr(Collision).
@manipulate for f = collect(1:num_features)
    points = Plots.Scatter(features[f,:], targets[1,:], markSize = 3)
    # The axis is the value of the body, so it is what the widget renders.
    Axis(points;
        title = "Feature vs Collision Probability",
        xlabel = "Feature",
        ylabel = "Pr(Collision)",
        width = "20cm",
        height = "12cm")
end

In [None]:
# compare two datasets
input_filepath_1 = "../../data/datasets/risk_10k_3_sec_burn_in.jld"
input_filepath_2 = "../../data/datasets/risk_10k_5_sec_burn_in.jld"
data_1 = JLD.load(input_filepath_1)
features_1, targets_1 = data_1["features"], data_1["targets"];
data_2 = JLD.load(input_filepath_2)
features_2, targets_2 = data_2["features"], data_2["targets"];
# Feature and sample counts are taken from the first dataset.
num_features, num_samples = size(features_1);
# Plot at most 128 samples, but never more columns than either dataset has,
# so the 1:num_sample_to_plot slices used for plotting stay in bounds.
num_sample_to_plot = min(128, num_samples, size(features_2, 2))

In [None]:
# scatter each feature against pr(collision) for each dataset
#
# The group plot is built inside the @manipulate body and returned from it:
# a single shared GroupPlot would receive two more axes on every widget
# update, overflowing the 2x1 layout, and would not be re-rendered.
@manipulate for f = collect(1:num_features)
    g = GroupPlot(2, 1, groupStyle = "horizontal sep = 1.75cm, vertical sep = 1.5cm")
    # One axis per dataset, left to right, each limited to the first
    # num_sample_to_plot samples.
    for (label, feats, targs) in (("Dataset 1", features_1, targets_1),
                                  ("Dataset 2", features_2, targets_2))
        points = Plots.Scatter(feats[f,1:num_sample_to_plot],
                               targs[1,1:num_sample_to_plot], markSize = 3)
        push!(g, Axis(points;
            xlabel = "Feature",
            ylabel = "Pr(Collision)",
            title = "$(label): Feature vs Collision Probability",
            width = "12cm",
            height = "12cm"))
    end
    g
end

In [2]:
# Read the risk features and targets from the HDF5 file. The do-block form of
# h5open closes the file handle once both datasets have been read, instead of
# leaving it open for the rest of the session.
input_filepath = "../../data/datasets/risk.h5"
features, targets = h5open(input_filepath, "r") do data
    (read(data["risk/features"]), read(data["risk/targets"]))
end;

In [3]:
# Print the dimensions of the feature matrix, then of the target matrix.
for arr in (features, targets)
    println(size(arr))
end

(62,1162)
(2,1162)


In [4]:
# Print the sum and then the mean of each target row, reducing along the
# second dimension.
for stat in (sum, mean)
    println(stat(targets, 2))
end

[183.5; 8.0]
[0.157917; 0.00688468]


In [5]:
# Linear indices of the target entries that lie strictly between 0 and 1.
btwn = find(t -> 0 < t < 1., targets)
# Print those indices, followed by the full target matrix for reference.
for shown in (btwn, targets)
    println(shown)
end

[7,13,21,31,33,43,47,54,63,77,81,139,141,143,149,159,163,185,187,189,191,199,201,225,227,231,234,267,317,331,355,356,359,379,385,387,388,393,395,401,413,421,439,465,495,496,501,505,507,511,526,529,541,555,559,571,572,615,649,741,745,761,767,791,801,803,813,827,828,837,854,861,881,897,900,927,953,955,967,987,997,1019,1021,1025,1027,1065,1073,1077,1078,1083,1097,1105,1127,1165,1209,1231,1251,1259,1281,1295,1309,1433,1447,1449,1459,1515,1521,1525,1565,1567,1573,1581,1595,1603,1607,1618,1623,1653,1659,1667,1681,1685,1723,1725,1729,1743,1745,1767,1781,1792,1825,1827,1843,1853,1855,1875,1887,1921,1937,1945,1963,1979,1999,2031,2032,2046,2053,2069,2071,2085,2101,2129,2135,2137,2151,2179,2181,2223,2233,2234,2245,2251,2263,2303,2317]
[0.0 1.0 0.0 0.5 0.0 0.0 0.5 0.0 1.0 0.0 0.5 0.0 0.0 0.0 0.0 0.5 0.5 0.0 0.0 0.0 1.0 0.5 0.0 0.5 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.5 0.0 0.0 0.0 0.0 0.0 0.0 0.5 0.0 0.5 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 1.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 0.0 1.0 1