In [1]:
# Load IPython's autoreload extension and use mode 2, which reloads imported
# modules before each cell is executed.
%load_ext autoreload
%autoreload 2
import os
# Make only CUDA device 0 visible to this process. This is set here, before
# TensorFlow is imported in the next cell.
os.environ["CUDA_VISIBLE_DEVICES"]="0"

In [2]:
import numpy as np
import matplotlib.pyplot as plt
import scipy.interpolate as interpolate
import simulators.jla_supernovae.jla_simulator as jla
import ndes.ndes as ndes
import delfi.delfi as delfi
import compression.score.score as score
import distributions.priors as priors
import tensorflow as tf
import getdist
from getdist import plots, MCSamples
import compression.IMNN.information_maximiser.utils as utils
import compression.IMNN.information_maximiser.IMNN as IMNN
# Only show TensorFlow log messages of severity ERROR or higher
tf.logging.set_verbosity(tf.logging.ERROR)
# Render matplotlib figures inline in the notebook
%matplotlib inline

In [3]:
### SET UP FOR SIMULATION CODE ###

# Model object used to generate the simulated data vectors
JLASimulator = jla.JLA_Model()

# Simulator function with the signature
#   simulator(theta, seed, simulator_args, batch) -> simulated data vector
def simulator(theta, seed, simulator_args, batch):
    """Return one simulated data vector for parameters `theta` and random `seed`.

    `simulator_args` and `batch` are part of the call signature but are not
    used here; the call is forwarded to `JLASimulator.simulation(theta, seed)`.
    """
    realisation = JLASimulator.simulation(theta, seed)
    return realisation
simulator_args = None

  dtype = None, names = True)


In [4]:
### SET UP THE PRIOR ###

# Hard lower/upper limits of the truncated prior, one entry per parameter
lower = np.array([0, -1.5, -20, 0, 0, -0.5])
upper = np.array([0.6, 0, -18, 1, 6, 0.5])

# Gaussian part of the prior: mean vector and covariance matrix.
# The covariance starts diagonal (squared widths) and then receives a single
# off-diagonal term coupling the first two parameters, written as
# (-0.8) * 0.4 * 0.75, i.e. the coefficient -0.8 times the two widths.
prior_mean = np.array([0.3, -0.75, -19.05, 0.125, 2.6, -0.05])
prior_covariance = np.diag([0.4, 0.75, 0.1, 0.025, 0.25, 0.05])**2
prior_covariance[0, 1] = -0.8*0.4*0.75
prior_covariance[1, 0] = prior_covariance[0, 1]

# Truncated Gaussian prior built from the pieces above
prior = priors.TruncatedGaussian(prior_mean, prior_covariance, lower, upper)

In [5]:
### SET UP THE COMPRESSOR ###

# Fiducial parameters
theta_fiducial = np.array([0.20181324, -0.74762939, -19.04253368, 0.12566322, 2.64387045, -0.05252869])

# Expected data (apparent magnitudes at the fiducial point) and inverse covariance
mu = JLASimulator.apparent_magnitude(theta_fiducial)
Cinv = JLASimulator.Cinv

# Derivatives of the expected data as returned by JLASimulator.dmudt,
# using step sizes of 1% of |theta_fiducial|
h = 0.01*np.abs(theta_fiducial)
dmudt = JLASimulator.dmudt(theta_fiducial, h)

# Score compression object for a Gaussian likelihood (score.Gaussian),
# including the Gaussian prior mean and covariance
Compressor = score.Gaussian(
    len(JLASimulator.data),
    theta_fiducial,
    mu = mu,
    Cinv = Cinv,
    dmudt = dmudt,
    prior_mean = prior_mean,
    prior_covariance = prior_covariance,
)

# Compute the Fisher matrix, then keep a handle on its inverse
Compressor.compute_fisher()
Finv = Compressor.Finv

# Compressor function with the signature
#   compressor(data, args) -> compressed summaries (pseudoMLE)
def compressor(d, compressor_args):
    """Compress data vector `d` with `Compressor.scoreMLE`.

    `compressor_args` is accepted as part of the call signature but is not used.
    """
    summaries = Compressor.scoreMLE(d)
    return summaries
compressor_args = None

In [6]:
### LOAD IN THE DATA VECTOR ###
# The data vector stored on the simulator object is used uncompressed; the
# commented-out alternative below would pass it through `compressor` first.
#data = compressor(JLASimulator.data, compressor_args)
data = JLASimulator.data

In [7]:
# Shape of the input
# NOTE(review): `data` is rebound to a dict of training arrays in a later cell,
# so this only yields the data-vector length when run before that rebinding.
input_shape = [len(data)]

In [8]:
# Run sims for training set

def _run_sims(theta, n_sims):
    """Run `n_sims` simulations at `theta`, drawing a new random seed for each.

    The seeds come from the global numpy RNG (np.random.randint), one draw per
    simulation, and the simulations are stacked along the first axis of the
    returned array.
    """
    return np.array([simulator(theta, np.random.randint(1e8), simulator_args=None, batch=1) for _ in range(n_sims)])

# Run sims at fiducial parameters (t: training set, tt: independent test set)
n_s = 10000
n_train = 1  # passed to n.train(...) in the training cell
t = _run_sims(theta_fiducial, n_s)
tt = _run_sims(theta_fiducial, n_s)

# Length of one simulated data vector. Read from the simulations themselves
# rather than from `len(data)`: `data` is rebound to the dict of training
# arrays further down, so re-running this cell would otherwise allocate
# arrays of the wrong size.
n_data = t.shape[1]

# How many sims to run for the derivatives
derivative_fraction = 0.05
n_p = int(n_s * derivative_fraction)

# Set the seed
seed = np.random.randint(1e6)

# Lower steps (theta_fiducial - h), one parameter shifted at a time
np.random.seed(seed)
t_m = np.zeros((n_p, len(theta_fiducial), n_data))
tt_m = np.zeros((n_p, len(theta_fiducial), n_data))
for a in range(len(theta_fiducial)):
    theta = np.copy(theta_fiducial)
    theta[a] = theta_fiducial[a] - h[a]
    t_m[:, a, :] = _run_sims(theta, n_p)
    tt_m[:, a, :] = _run_sims(theta, n_p)

# Upper steps (theta_fiducial + h). The global RNG is reset to the same seed
# as for the lower steps, so the seed draws start from the same RNG state.
np.random.seed(seed)
t_p = np.zeros((n_p, len(theta_fiducial), n_data))
tt_p = np.zeros((n_p, len(theta_fiducial), n_data))
for a in range(len(theta_fiducial)):
    theta = np.copy(theta_fiducial)
    theta[a] = theta_fiducial[a] + h[a]
    t_p[:, a, :] = _run_sims(theta, n_p)
    tt_p[:, a, :] = _run_sims(theta, n_p)
# Re-seed the global RNG without a fixed seed so later draws are not tied to `seed`
np.random.seed()

# Denominator of the central finite difference, 1 / (2 h), per parameter
der_den = 1. / (2. * h)

In [9]:
# Bundle the simulations into the dict that is handed to the IMNN as
# 'preload data': fiducial sims ("x_central"), theta - h sims ("x_m"),
# theta + h sims ("x_p"), and a second set of each under the "*_test" keys.
# NOTE: this rebinds `data`, which until here referred to JLASimulator.data.
data = {"x_central": t, "x_m": t_m, "x_p": t_p, "x_central_test": tt, "x_m_test": tt_m, "x_p_test": tt_p}

In [10]:
# IMNN network set-up
# Configuration dict consumed by IMNN.IMNN. The meaning of each key is defined
# by the IMNN module; notes marked "presumably" are assumptions to confirm
# against that module.
parameters = {
    'verbose': True,
    'number of simulations': n_s,  # number of fiducial simulations run above
    'fiducial θ': theta_fiducial,
    'derivative denominator': der_den,  # 1 / (2 h) from the simulation cell
    'differentiation fraction': derivative_fraction,  # n_p = int(n_s * derivative_fraction)
    'number of summaries': len(theta_fiducial),  # one summary per parameter
    'calculate MLE': True,
    'prebuild': True,
    'input shape': input_shape,
    'preload data': data,  # the dict of simulation arrays, not the raw data vector
    'save file': "data/saved_model",
    'wv': 0.,  # presumably weight-initialisation setting — TODO confirm
    'bb': 0.1,  # presumably bias-initialisation setting — TODO confirm
    'activation': tf.nn.leaky_relu,
    'α': 0.01,  # presumably the leaky-ReLU slope parameter — TODO confirm
    'hidden layers': [740, 300, 100, 50],  # hidden-layer widths
}

# Initialise the network
n = IMNN.IMNN(parameters = parameters)

# Build the network
η = 1e-3 # learning rate
# Clear the default TensorFlow graph before the network graph is built by setup()
tf.reset_default_graph()
n.setup(η = η)

saving model as data/saved_model.meta
network architecture is [[740], 740, 300, 100, 50, 6].
Tensor("x:0", shape=(?, 740), dtype=float32)
Tensor("IMNN/layer_1/dense_1/mul:0", shape=(?, 740), dtype=float32)
Tensor("IMNN/layer_2/dense_2/mul:0", shape=(?, 300), dtype=float32)
Tensor("IMNN/layer_3/dense_3/mul:0", shape=(?, 100), dtype=float32)
Tensor("IMNN/layer_4/dense_4/mul:0", shape=(?, 50), dtype=float32)
Tensor("IMNN/layer_5/LeakyRelu:0", shape=(?, 6), dtype=float32)
Tensor("output:0", shape=(?, 6), dtype=float32)
Tensor("GatherNd:0", shape=(10000, 740), dtype=float32)
Tensor("IMNN_1/layer_1/dense_1/mul:0", shape=(10000, 740), dtype=float32)
Tensor("IMNN_1/layer_2/dense_2/mul:0", shape=(10000, 300), dtype=float32)
Tensor("IMNN_1/layer_3/dense_3/mul:0", shape=(10000, 100), dtype=float32)
Tensor("IMNN_1/layer_4/dense_4/mul:0", shape=(10000, 50), dtype=float32)
Tensor("IMNN_1/layer_5/LeakyRelu:0", shape=(10000, 6), dtype=float32)
Tensor("Reshape:0", shape=(3000, 740), dtype=float32)
Tens

In [11]:
# Train the IMNN
# NOTE(review): the saved output of this cell shows training aborting with
# "InvalidArgumentError: Input is not invertible" at the
# 'inverse_central_covariance' op; the cause is not visible from this notebook.
num_epochs = 300
keep_rate = 0.8  # presumably the dropout keep probability — TODO confirm
n.train(
    num_epochs = num_epochs,
    n_train = n_train,
    keep_rate = keep_rate,
    history = True,
)

  0%|          | 0/300 [00:00<?, ?it/s]

InvalidArgumentError: Input is not invertible.
	 [[node inverse_central_covariance (defined at /Users/justinalsing/Dropbox/science/delfi/master/delfi/compression/IMNN/information_maximiser/IMNN.py:401)  = MatrixInverse[T=DT_FLOAT, adjoint=false, _device="/job:localhost/replica:0/task:0/device:CPU:0"](central_covariance)]]

Caused by op 'inverse_central_covariance', defined at:
  File "/usr/local/Cellar/python/3.6.5_1/Frameworks/Python.framework/Versions/3.6/lib/python3.6/runpy.py", line 193, in _run_module_as_main
    "__main__", mod_spec)
  File "/usr/local/Cellar/python/3.6.5_1/Frameworks/Python.framework/Versions/3.6/lib/python3.6/runpy.py", line 85, in _run_code
    exec(code, run_globals)
  File "/usr/local/lib/python3.6/site-packages/ipykernel_launcher.py", line 16, in <module>
    app.launch_new_instance()
  File "/usr/local/lib/python3.6/site-packages/traitlets/config/application.py", line 658, in launch_instance
    app.start()
  File "/usr/local/lib/python3.6/site-packages/ipykernel/kernelapp.py", line 505, in start
    self.io_loop.start()
  File "/usr/local/lib/python3.6/site-packages/tornado/platform/asyncio.py", line 132, in start
    self.asyncio_loop.run_forever()
  File "/usr/local/Cellar/python/3.6.5_1/Frameworks/Python.framework/Versions/3.6/lib/python3.6/asyncio/base_events.py", line 422, in run_forever
    self._run_once()
  File "/usr/local/Cellar/python/3.6.5_1/Frameworks/Python.framework/Versions/3.6/lib/python3.6/asyncio/base_events.py", line 1432, in _run_once
    handle._run()
  File "/usr/local/Cellar/python/3.6.5_1/Frameworks/Python.framework/Versions/3.6/lib/python3.6/asyncio/events.py", line 145, in _run
    self._callback(*self._args)
  File "/usr/local/lib/python3.6/site-packages/tornado/ioloop.py", line 758, in _run_callback
    ret = callback()
  File "/usr/local/lib/python3.6/site-packages/tornado/stack_context.py", line 300, in null_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 1233, in inner
    self.run()
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 1147, in run
    yielded = self.gen.send(value)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/kernelbase.py", line 370, in dispatch_queue
    yield self.process_one()
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 346, in wrapper
    runner = Runner(result, future, yielded)
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 1080, in __init__
    self.run()
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 1147, in run
    yielded = self.gen.send(value)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/kernelbase.py", line 357, in process_one
    yield gen.maybe_future(dispatch(*args))
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 326, in wrapper
    yielded = next(result)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/kernelbase.py", line 267, in dispatch_shell
    yield gen.maybe_future(handler(stream, idents, msg))
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 326, in wrapper
    yielded = next(result)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/kernelbase.py", line 534, in execute_request
    user_expressions, allow_stdin,
  File "/usr/local/lib/python3.6/site-packages/tornado/gen.py", line 326, in wrapper
    yielded = next(result)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/ipkernel.py", line 294, in do_execute
    res = shell.run_cell(code, store_history=store_history, silent=silent)
  File "/usr/local/lib/python3.6/site-packages/ipykernel/zmqshell.py", line 536, in run_cell
    return super(ZMQInteractiveShell, self).run_cell(*args, **kwargs)
  File "/usr/local/lib/python3.6/site-packages/IPython/core/interactiveshell.py", line 2819, in run_cell
    raw_cell, store_history, silent, shell_futures)
  File "/usr/local/lib/python3.6/site-packages/IPython/core/interactiveshell.py", line 2845, in _run_cell
    return runner(coro)
  File "/usr/local/lib/python3.6/site-packages/IPython/core/async_helpers.py", line 67, in _pseudo_sync_runner
    coro.send(None)
  File "/usr/local/lib/python3.6/site-packages/IPython/core/interactiveshell.py", line 3020, in run_cell_async
    interactivity=interactivity, compiler=compiler, result=result)
  File "/usr/local/lib/python3.6/site-packages/IPython/core/interactiveshell.py", line 3191, in run_ast_nodes
    if (yield from self.run_code(code, result)):
  File "/usr/local/lib/python3.6/site-packages/IPython/core/interactiveshell.py", line 3267, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "<ipython-input-10-c8a018225115>", line 27, in <module>
    n.setup(η = η)
  File "/Users/justinalsing/Dropbox/science/delfi/master/delfi/compression/IMNN/information_maximiser/IMNN.py", line 669, in setup
    F, iC, μ, dμdθ, C = n.Fisher(output_central, output_m, output_p)
  File "/Users/justinalsing/Dropbox/science/delfi/master/delfi/compression/IMNN/information_maximiser/IMNN.py", line 465, in Fisher
    iC, μ, C = n.inverse_covariance(a)
  File "/Users/justinalsing/Dropbox/science/delfi/master/delfi/compression/IMNN/information_maximiser/IMNN.py", line 401, in inverse_covariance
    iC = tf.matrix_inverse(C, name = 'inverse_central_covariance')
  File "/usr/local/lib/python3.6/site-packages/tensorflow/python/ops/gen_linalg_ops.py", line 1041, in matrix_inverse
    "MatrixInverse", input=input, adjoint=adjoint, name=name)
  File "/usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py", line 787, in _apply_op_helper
    op_def=op_def)
  File "/usr/local/lib/python3.6/site-packages/tensorflow/python/util/deprecation.py", line 488, in new_func
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 3274, in create_op
    op_def=op_def)
  File "/usr/local/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 1770, in __init__
    self._traceback = tf_stack.extract_stack()

InvalidArgumentError (see above for traceback): Input is not invertible.
	 [[node inverse_central_covariance (defined at /Users/justinalsing/Dropbox/science/delfi/master/delfi/compression/IMNN/information_maximiser/IMNN.py:401)  = MatrixInverse[T=DT_FLOAT, adjoint=false, _device="/job:localhost/replica:0/task:0/device:CPU:0"](central_covariance)]]


In [None]:
def _per_epoch(values):
    """Reshape a per-epoch history into a 2-D array.

    The result has one row per epoch and one column per component, so it can
    be plotted against the epoch axis (matplotlib draws one line per column).
    A history with a single value per epoch becomes a single column.
    """
    arr = np.asarray(values)
    return arr.reshape((arr.shape[0], int(np.prod(arr.shape[1:]))))

# Five stacked panels sharing the epoch axis: det(F), Λ, det(C), dμ/dθ and μ,
# each showing the training history (colour C0) and the test history (C1).
fig, ax = plt.subplots(5, 1, sharex = True, figsize = (8, 14))
plt.subplots_adjust(hspace = 0)
end = len(n.history["det(F)"])
epochs = np.arange(end)

a, = ax[0].plot(epochs, n.history["det(F)"], label = 'Training data')
b, = ax[0].plot(epochs, n.history["det(test F)"], label = 'Test data')
ax[0].legend(frameon = False)
ax[0].set_ylabel(r'$|{\bf F}_{\alpha\beta}|$')

ax[1].plot(epochs, n.history["Λ"])
ax[1].plot(epochs, n.history["test Λ"])
ax[1].set_ylabel(r'$\Lambda$')

ax[2].plot(epochs, n.history["det(C)"])
ax[2].plot(epochs, n.history["det(test C)"])
ax[2].set_ylabel(r'$|{\bf C}|$')

# dμ/dθ and μ hold several values per epoch when there is more than one
# summary/parameter. Flattening them to one long vector no longer matches the
# length of `epochs`, so they are plotted as one line per component instead.
ax[3].plot(epochs, _per_epoch(n.history["dμdθ"]), color = 'C0')
ax[3].plot(epochs, _per_epoch(n.history["test dμdθ"]), color = 'C1')
ax[3].set_ylabel(r'$\partial\mu/\partial\theta$')

ax[4].plot(epochs, _per_epoch(n.history["μ"]), color = 'C0')
ax[4].plot(epochs, _per_epoch(n.history["test μ"]), color = 'C1')
ax[4].set_ylabel('μ')

# The x-axis is shared and the panels touch (hspace = 0), so only the bottom
# panel carries the axis label; the limits propagate to all panels.
ax[4].set_xlabel('Number of epochs')
ax[4].set_xlim([0, len(epochs)]);