In [1]:
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
%matplotlib notebook
import time
import datetime

# Record when the experiment started. The compact MMDDYY stamp stored in
# `current_time` becomes part of the run description that names output folders.
experiment_start = datetime.datetime.now()
print("Current_date: "+str(experiment_start))
# Use explicit format codes instead of the locale-dependent "%x": under a
# non-US locale "%x" can produce e.g. "07.02.2020", which the former
# split('/') would leave untouched and which would change the folder names.
current_time = experiment_start.strftime("%m%d%y")


#Import usual things required for graph nets
import numpy as np
import pandas as pd
import networkx as nx
import sonnet as snt
import tensorflow as tf
import os
import sys
from matplotlib import pyplot as plt
from matplotlib import animation
import seaborn as sns

#Import graph nets
from graph_nets import blocks
from graph_nets import utils_tf
from graph_nets import utils_np
from graph_nets.demos import models

# Path to the scripts shared throughout the phases:
# <two levels above the working directory>/Common/Scripts
parent_path = os.path.abspath('..')
# os.path.dirname replaces the manual '/'.join(split('/')[:-1]) so the lookup
# does not depend on '/' being the path separator.
path_common = os.path.join(os.path.dirname(parent_path), 'Common', 'Scripts')
# Warn (without aborting) when the shared-scripts folder is missing. The message
# must concatenate the path itself; concatenating the boolean returned by
# os.path.exists() raised a TypeError instead of printing the warning.
if not os.path.exists(path_common):
    print('The path: ' + path_common + ' is not found!')
# Put the shared scripts first on the import path for the imports that follow.
sys.path.insert(0, path_common)

# Output locations for this experiment, all below `base`.
base = os.path.join(parent_path,'Not_Moving_RigidBody','one_way_varying_sizes')
# Saved models and trajectories
path_saves = os.path.join(base,'Saves')
# Plots
path_plots = os.path.join(base,'Plots')
# Animations
path_animations = os.path.join(base,'Animations')

# Create whatever is missing. os.makedirs (unlike os.mkdir) also creates
# missing intermediate folders, so a fresh checkout without the
# 'Not_Moving_RigidBody' folder no longer fails on the first directory.
for _out_dir in (base, path_saves, path_plots, path_animations):
    if not os.path.exists(_out_dir):
        os.makedirs(_out_dir)
        
# Experiment hyper-parameters -- edit these to configure a run.
num_training_iterations = 20000
batch_size_tr = 256
batch_size_ge = 100
num_time_steps = 50

# Run description; it is used as the name of the per-run output folders.
# Note that there is no "_" separator in front of "date=".
desc = "".join([
    "ntr=", str(num_training_iterations),
    "_btr=", str(batch_size_tr),
    "_bge=", str(batch_size_ge),
    "date=", str(current_time),
])

# Seed NumPy and TensorFlow with the same fixed value for reproducibility.
SEED = 1
np.random.seed(SEED)
tf.set_random_seed(SEED)

Current_date: 2020-02-07 20:05:20.830953

The TensorFlow contrib module will not be included in TensorFlow 2.0.
For more information, please see:
  * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md
  * https://github.com/tensorflow/addons
  * https://github.com/tensorflow/io (for I/O related ops)
If you depend on functionality not listed there, please file an issue.



## Import functions

In [2]:
#Import functions for simulating
from Simulation_Functions_extended import SpringMassSimulator, generate_trajectory, roll_out_physics
#Import functions for creating graph
from Graph_creator_functions import rigid_rectangle_graph_extended
#Import visualisation functions

## Define loss functions

In [3]:
def create_loss_ops(target_op, output_ops):
    """Build one supervised loss per model output.

    For every output graph the loss is the squared difference between the
    graph's node values and columns 2:4 of the target, summed over the last
    axis and averaged over the remaining ones. Both sides are cast to float64
    before the subtraction.

    Args:
        target_op: The target tf.Tensor; columns 2:4 hold the target velocity.
        output_ops: The list of output graphs from the model.

    Returns:
        A list of loss values (tf.Tensor), one per output op.
    """
    def _squared_error_loss(output_op):
        # Same op order as a single nested expression: cast the prediction,
        # slice and cast the target, then reduce.
        predicted = tf.cast(output_op.nodes, tf.float64)
        expected = tf.cast(target_op[..., 2:4], tf.float64)
        per_node_error = tf.reduce_sum((predicted - expected) ** 2, axis=-1)
        return tf.reduce_mean(per_node_error)

    loss_ops = []
    for output_op in output_ops:
        loss_ops.append(_squared_error_loss(output_op))
    return loss_ops


def make_all_runnable_in_session(*args):
    """Make every given graph runnable in a session.

    Each positional argument is passed, in order, through
    `utils_tf.make_runnable_in_session`; the results are returned as a list
    (an empty list when called without arguments).
    """
    runnable_graphs = []
    for graph in args:
        runnable_graphs.append(utils_tf.make_runnable_in_session(graph))
    return runnable_graphs

# Define the Model

In [4]:
# Start from an empty default TensorFlow graph so that re-running this cell
# does not keep adding ops to the graph built by a previous run.
tf.reset_default_graph()
# Create the model. node_output_size=2 requests two output values per node,
# which create_loss_ops compares against columns 2:4 of the target nodes.
model = models.EncodeProcessDecode(node_output_size=2)






# Training the Network: Chain
## Generate:
- Model
- Training trajectory 5 to 9 masses
- Generalization trajectories: 4 mass, 9 mass

In [5]:
#@title Set up model training and evaluation  { form-width: "30%" }

# The model we explore includes three components:
# - An "Encoder" graph net, which independently encodes the edge, node, and
#   global attributes (does not compute relations etc.).
# - A "Core" graph net, which performs N rounds of processing (message-passing)
#   steps. The input to the Core is the concatenation of the Encoder's output
#   and the previous output of the Core (labeled "Hidden(t)" below, where "t" is
#   the processing step).
# - A "Decoder" graph net, which independently decodes the edge, node, and
#   global attributes (does not compute relations etc.), on each
#   message-passing step.
#
#                     Hidden(t)   Hidden(t+1)
#                        |            ^
#           *---------*  |  *------*  |  *---------*
#           |         |  |  |      |  |  |         |
# Input --->| Encoder |  *->| Core |--*->| Decoder |---> Output(t)
#           |         |---->|      |     |         |
#           *---------*     *------*     *---------*
#
# The model is trained by supervised learning. Input mass-spring systems are
# procedurally generated, where the nodes represent the positions, velocities,
# and indicators of whether the mass is fixed in space or free to move, the
# edges represent the spring constant and spring rest length, and the global
# attribute represents the variable coefficient of gravitational acceleration.
# The outputs/targets have the same structure, with the nodes representing the
# masses' next-step states.
#
# The training loss is computed on the output of each processing step. The
# reason for this is to encourage the model to try to solve the problem in as
# few steps as possible. It also helps make the output of intermediate steps
# more interpretable.
#
# There's no need for a separate evaluate dataset because the inputs are
# never repeated, so the training loss is the measure of performance on graphs
# from the input distribution.
#
# We also evaluate how well the models generalize to systems which are one mass
# larger, and smaller, than those from the training distribution. The loss is
# computed as the mean over a 50-step rollout, where each step's input is the
# the previous step's output.
#
# Variables with the suffix _tr are training parameters, and variables with the
# suffix _ge are test/generalization parameters.
#
# After around 10000-20000 training iterations the model reaches good
# performance on mass-spring systems with 5-8 masses.


# Dedicated NumPy random generator, seeded with SEED; used below to draw the
# rectangle sizes of the training batch.
rand = np.random.RandomState(SEED)

# Model parameters: number of message-passing steps passed to the model for
# training (_tr) and for generalization (_ge).
num_processing_steps_tr = 1
num_processing_steps_ge = 1

# Data / training parameters.
# num_training_iterations, batch_size_tr, batch_size_ge and num_time_steps are
# not set here; the values from the configuration cell at the top are used.
step_size = 0.1



# Data.
# Base graphs for training.

# (low, high) bounds handed to rand.randint. NumPy excludes the upper bound,
# so len_a is drawn from 1..6 and len_b from 14..19.
len_a_mix_max = (1,7)
len_b_mix_max = (14,20)

# One (len_a, len_b) pair per training example.
len_as = rand.randint(*len_a_mix_max, size=batch_size_tr)
len_bs = rand.randint(*len_b_mix_max, size=batch_size_tr)

# One graph data-dict per training example. Only the first two arguments vary;
# the meaning of the remaining positional arguments (50., 1, 0., True) is
# defined in Graph_creator_functions and is not visible from this notebook.
static_graph_tr = [rigid_rectangle_graph_extended(len_a,len_b, 50., 1, 0.,True) for len_a,len_b in zip(len_as,len_bs)]
base_graph_tr =  utils_tf.data_dicts_to_graphs_tuple(static_graph_tr)

# Base graphs for testing.

# A single fixed size (5, 20): the same data-dict is repeated batch_size_ge
# times. len_b = 20 is outside the range drawn for training (14..19).
base_graph_ge = utils_tf.data_dicts_to_graphs_tuple([rigid_rectangle_graph_extended(5, 20, 50., 1, 0.,True)] * batch_size_ge)

# True physics simulator for data generation.
simulator = SpringMassSimulator(step_size=step_size)
# Training.
# Generate a training trajectory with the true simulator. The three
# *_noise_level arguments set the noise applied to nodes, edges and globals.
initial_conditions_tr, true_trajectory_tr = generate_trajectory(
    simulator,
    base_graph_tr,
    num_time_steps,
    step_size,
    node_noise_level=0.04,
    edge_noise_level=5.0,
    global_noise_level=1.0,
    do_set_rest=True,do_apply_gravity=True)
# Random start step, re-sampled on every session run. tf.random_uniform
# excludes maxval, so t is at most num_time_steps - 2 and t + 1 at most
# num_time_steps - 1.
t = tf.random_uniform([], minval=0, maxval=num_time_steps - 1, dtype=tf.int32)
# Model input: the initial-condition graph with its nodes replaced by the true
# nodes at step t. Target: the true nodes one step later.
input_graph_tr = initial_conditions_tr.replace(nodes=true_trajectory_tr[t])
target_nodes_tr = true_trajectory_tr[t + 1]

# One output graph per processing step.
output_ops_tr = model(input_graph_tr, num_processing_steps_tr)

# Generalization data: initial conditions built from base_graph_ge with the
# same noise levels as for training. The learned model is passed in the
# simulator position here, but the trajectory it produces is discarded (`_`);
# only the initial conditions are kept.
initial_conditions_ge, _ = generate_trajectory(
    lambda x: model(x, num_processing_steps_ge),
    base_graph_ge,
    num_time_steps,
    step_size,
    node_noise_level=0.04,
    edge_noise_level=5.0,
    global_noise_level=1.0,
    do_set_rest=True,do_apply_gravity=True)
# Roll the same initial conditions forward twice: once with the true simulator
# and once with the learned model.
_, true_nodes_rollout_ge = roll_out_physics(
    simulator, initial_conditions_ge, num_time_steps, step_size)
_, predicted_nodes_rollout_ge = roll_out_physics(
    lambda x: model(x, num_processing_steps_ge), initial_conditions_ge,
    num_time_steps, step_size)

# Training loss: one loss per processing step ...
loss_ops_tr = create_loss_ops(target_nodes_tr, output_ops_tr)
# ... averaged across processing steps.
loss_op_tr = sum(loss_ops_tr) / num_processing_steps_tr
# Test/generalization loss: squared difference between the predicted and true
# rollouts on columns 2:4 (the same slice create_loss_ops uses as the velocity
# target), summed over the last axis and averaged over the rest.
loss_op_ge = tf.reduce_mean(
    tf.reduce_sum(
        (predicted_nodes_rollout_ge[..., 2:4] -
         true_nodes_rollout_ge[..., 2:4])**2,
        axis=-1))

# Optimizer: Adam minimizing the training loss only.
learning_rate = 1e-3
optimizer = tf.train.AdamOptimizer(learning_rate)
step_op = optimizer.minimize(loss_op_tr)

# make_all_runnable_in_session returns a list, so from here on input_graph_tr
# and initial_conditions_ge are one-element lists.
input_graph_tr = make_all_runnable_in_session(input_graph_tr)
initial_conditions_ge = make_all_runnable_in_session(initial_conditions_ge)

Instructions for updating:
Use tf.where in 2.0, which has the same broadcast rule as np.where


Instructions for updating:
Call initializer instance with the dtype argument instead of passing it to the constructor
Instructions for updating:
Call initializer instance with the dtype argument instead of passing it to the constructor



### Reset Tensorflow session, but keep the same computational graph.

In [6]:
#@title Reset session  { form-width: "30%" }


# Saver used by the "Save Model" and "Load Model" cells further down.
saver = tf.train.Saver()
# This cell resets the TensorFlow session: close the previous session if one
# exists (a NameError just means this is the first run), then open a new one
# and re-initialize all variables. The computational graph is left unchanged.
try:
    sess.close()
except NameError:
    pass
sess = tf.Session()
sess.run(tf.global_variables_initializer())

# Snapshot one weight matrix (first linear layer of the edge block MLP, selected
# by its variable name) before training, so it can be compared with the trained
# values later on.
var = [v for v in tf.trainable_variables() if v.name == 'MLPGraphNetwork/graph_network/edge_block/mlp/linear_0/w:0']
pre_train_np = sess.run(var)
print(pre_train_np)


# Training bookkeeping; re-running this cell restarts training from iteration 0
# and discards the logged losses.
last_iteration = 0
logged_iterations = []
losses_tr = []
losses_ge = []

[array([[-0.03804378, -0.02842822, -0.0177331 , ..., -0.04071054,
         0.07211056, -0.0120081 ],
       [-0.06830946,  0.14129351,  0.04931194, ...,  0.00310976,
        -0.02770088, -0.07372261],
       [ 0.11897311, -0.10758854, -0.02762611, ...,  0.03443757,
         0.05117009, -0.05914008],
       ...,
       [ 0.16938609, -0.01587653, -0.03111833, ...,  0.1654855 ,
         0.15000105, -0.0039337 ],
       [-0.03774908,  0.10090108, -0.03598287, ...,  0.04738074,
        -0.1002662 , -0.02604311],
       [ 0.08875753,  0.14404969,  0.03646467, ...,  0.08237012,
        -0.06607509, -0.05425633]], dtype=float32)]


### Train Network

In [7]:
#@title Run training  { form-width: "30%" }

# You can interrupt this cell's training loop at any time, and visualize the
# intermediate results by running the next cell (below). You can then resume
# training by simply executing this cell again.

# How much time between logging and printing the current results.
log_every_seconds = 5

print("# (iteration number), T (elapsed seconds), "
      "Ltr (training 1-step loss), "
      "Lge (test/generalization rollout loss)")

start_time = time.time()
last_log_time = start_time
# Start from last_iteration so that re-executing this cell resumes training.
# last_iteration is set to the iteration that is about to run, so after an
# interruption that iteration index is run again.
for iteration in range(last_iteration, num_training_iterations):
    last_iteration = iteration
    # One optimizer step; the loss, input graph, targets and outputs of the
    # same run are fetched alongside it.
    train_values = sess.run({
        "step": step_op,
        "loss": loss_op_tr,
        "input_graph": input_graph_tr,
        "target_nodes": target_nodes_tr,
        "outputs": output_ops_tr
    })
    the_time = time.time()
    elapsed_since_last_log = the_time - last_log_time
    # The generalization rollout is only evaluated when logging, i.e. at most
    # once every log_every_seconds seconds of wall-clock time.
    if elapsed_since_last_log > log_every_seconds:
        last_log_time = the_time
        # test_values is only (re)assigned here; the "Save Trajectories" cell
        # reads the rollouts of the most recent log event from it.
        test_values = sess.run({
            "loss_ge": loss_op_ge,
            "true_rollout_ge": true_nodes_rollout_ge,
            "predicted_rollout_ge": predicted_nodes_rollout_ge,
        })
        elapsed = time.time() - start_time
        # Losses are recorded at log events only, together with the iteration
        # number, so the three lists always have the same length.
        losses_tr.append(train_values["loss"])
        losses_ge.append(test_values["loss_ge"])
        logged_iterations.append(iteration)
        print("# {:05d}, T {:.1f}, Ltr {:.4f}, Lge {:.4f}".format(
            iteration, elapsed, train_values["loss"], test_values["loss_ge"]))

# (iteration number), T (elapsed seconds), Ltr (training 1-step loss), Lge (test/generalization rollout loss)
# 00217, T 5.3, Ltr 0.7187, Lge 0.5718
# 00458, T 10.1, Ltr 0.0924, Lge 0.7616
# 00713, T 15.1, Ltr 0.1025, Lge 1.6421
# 00968, T 20.1, Ltr 0.0203, Lge 0.4505
# 01225, T 25.1, Ltr 0.0701, Lge 0.4733
# 01484, T 30.1, Ltr 0.0399, Lge 0.5478
# 01740, T 35.1, Ltr 0.0117, Lge 0.4046
# 01999, T 40.1, Ltr 0.0180, Lge 1.6745
# 02255, T 45.1, Ltr 0.0127, Lge 0.3280
# 02508, T 50.1, Ltr 0.0166, Lge 0.3819
# 02763, T 55.1, Ltr 0.0189, Lge 0.3327
# 03020, T 60.1, Ltr 0.0273, Lge 0.4237
# 03276, T 65.1, Ltr 0.0133, Lge 0.3883
# 03531, T 70.2, Ltr 0.0285, Lge 2.0098
# 03787, T 75.2, Ltr 0.0111, Lge 0.3457
# 04044, T 80.2, Ltr 0.0144, Lge 0.4865
# 04302, T 85.2, Ltr 0.0137, Lge 0.5259
# 04557, T 90.2, Ltr 0.0063, Lge 0.3155
# 04814, T 95.2, Ltr 0.0064, Lge 0.3168
# 05068, T 100.2, Ltr 0.0065, Lge 0.2694
# 05325, T 105.2, Ltr 0.0083, Lge 0.1998
# 05583, T 110.3, Ltr 0.0053, Lge 0.1447
# 05841,

In [8]:
# Fetch the same edge-block weight matrix that was captured in pre_train_np and
# print the element-wise change (current values minus pre-training values).
var = [v for v in tf.trainable_variables() if v.name == 'MLPGraphNetwork/graph_network/edge_block/mlp/linear_0/w:0']
post_train_np = sess.run(var)
print(np.array(post_train_np)-np.array(pre_train_np))

[[[-0.01543435 -0.03472479 -0.01982524 ...  0.03471715 -0.06789981
    0.00987422]
  [ 0.00213377  0.02425139 -0.00798688 ... -0.16754334  0.091775
    0.07238264]
  [ 0.081834   -0.02096055  0.05293066 ...  0.06618313  0.004441
   -0.01698746]
  ...
  [-0.00108035 -0.01607736  0.01475503 ...  0.09446809 -0.03089446
    0.00075264]
  [ 0.00269017 -0.03350035  0.01444349 ...  0.12298305  0.02015655
   -0.02443589]
  [ 0.0655745  -0.03531352  0.02579173 ...  0.08006177  0.02207464
   -0.03439967]]]


## Save Model

In [9]:
# Folder and checkpoint prefix for this run.
model_dir = os.path.join(path_saves, desc)
checkpoint_prefix = os.path.join(model_dir, "model.ckpt")
# With the Saver's default checkpoint format no file is written under the bare
# prefix; the files are "<prefix>.index", "<prefix>.meta" and "<prefix>.data-*".
# Testing only the bare prefix therefore never detected an existing checkpoint
# and silently overwrote it, so the ".index" file is checked as well.
if os.path.exists(checkpoint_prefix) or os.path.exists(checkpoint_prefix + ".index"):
    print("The file: "+ "model.ckpt" + " already exists. Delete it before saving a new model!")
else:
    if not os.path.exists(model_dir):
        os.makedirs(model_dir)
    save_path = saver.save(sess, checkpoint_prefix)
    print("Model saved in path: %s" % save_path)
        
        



Model saved in path: /home/bence/git_workspace/Dyadic_Collaboration/Graph_Networks/Phases/Phase1/Not_Moving_RigidBody/Simple_one_way_varying_sizes/Saves/ntr=20000_btr=256_bge=100date=020720/model.ckpt


## Load Model (Optional)

In [None]:
# Restore the weights of a previously saved run into the current session. The
# folder name is hard-coded and follows the same pattern as `desc`; change it
# to the run that should be loaded.
saver.restore(sess,os.path.join(path_saves, "ntr=3000_btr=256_bge=100date=020620")+"/model.ckpt")

# Print the restored edge-block weight matrix as a check on what was loaded.
var = [v for v in tf.trainable_variables() if v.name == 'MLPGraphNetwork/graph_network/edge_block/mlp/linear_0/w:0']
post_restore_np = sess.run(var)
print(np.array(post_restore_np))

## Save Trajectories

In [12]:
#Describe the experiment


def get_node_trajectories(rollout_array, batch_size):
    """Split a batched rollout into one position trajectory per system.

    Args:
        rollout_array: Array whose last axis holds the node features; only the
            first two features are kept.
        batch_size: Number of equal sections to cut axis 1 into.

    Returns:
        A list of `batch_size` arrays, in order along axis 1.
    """
    first_two_features = rollout_array[..., :2]
    per_system = np.split(first_two_features, batch_size, axis=1)
    return per_system

# Store the data: split the rollouts of the most recent log event into one
# position trajectory per generalization system.
true_rollouts = get_node_trajectories(test_values["true_rollout_ge"],batch_size_ge)
true_trajectory_np = np.array(true_rollouts)

predicted_rollouts = get_node_trajectories(test_values["predicted_rollout_ge"],batch_size_ge)
predicted_trajectory_np=np.array(predicted_rollouts)


l_names = ["true_trajectory.npy",
           "predicted_trajectory.npy"]

l_data = [true_trajectory_np,
          predicted_trajectory_np]

# Create the run folder once, up front, instead of re-checking it per file.
trajectory_dir = os.path.join(path_saves, desc)
if not os.path.exists(trajectory_dir):
    os.makedirs(trajectory_dir)

# Existing files are never overwritten; they are reported instead.
for fname, fdata in zip(l_names,l_data):
    trajectory_file = os.path.join(trajectory_dir, fname)
    if os.path.exists(trajectory_file):
        print("The file: "+ fname + " already exists. Delete it before saving a new trajectory!")
    else:
        np.save(trajectory_file, fdata)

In [16]:
# Choose a simulated system: the last one of the generalization batch.
# The selection is taken from the per-system lists (`true_rollouts`,
# `predicted_rollouts`) rather than by re-slicing `true_trajectory_np` in
# place, so re-running this cell keeps selecting a whole system instead of
# stripping one more dimension on every execution.
true_trajectory_np = np.array(true_rollouts)[-1]

predicted_trajectory_np = np.array(predicted_rollouts)[-1]

[[ -3.8663747  -23.787111  ]
 [ -1.7713808   15.877946  ]
 [  6.013218   -24.701296  ]
 [  8.246057    15.340458  ]
 [  0.03780567   0.0290212 ]]


## Plot and Save Convergence plot

In [14]:
fig = plt.figure(1, figsize=(12, 3))
fig.clf()
# Iteration numbers at which the losses were logged (shared x axis).
x = np.array(logged_iterations)


# Next-step loss.
y = losses_tr
ax = fig.add_subplot(1, 2, 1)
ax.plot(x, y, "k")
ax.set_title("Next step loss: Training")
ax.set_xlabel("Training iteration")
ax.set_ylabel("Loss")

# Rollout loss.
y = losses_ge
ax = fig.add_subplot(1, 2, 2)
ax.plot(x, y, "k")
ax.set_title("Rollout loss: Generalisation")
ax.set_xlabel("Training iteration")
ax.set_ylabel("Loss")

fig.tight_layout()


# Save figure. The file is written to the same location that is checked for an
# existing plot (below `path_plots`); saving to the working-directory-relative
# "Plots/..." could fail or write to a different folder than the one checked.
plot_dir = os.path.join(path_plots, desc)
plot_file = os.path.join(plot_dir, "ConvergencePlot.png")
if os.path.exists(plot_file):
    print("The file: "+ "ConvergencePlot.png" + " already exists. Delete it before saving a new plot!")
else:
    if not os.path.exists(plot_dir):
        os.makedirs(plot_dir)

    fig.savefig(plot_file)

<IPython.core.display.Javascript object>

## Plot and Save Trajectories Error plot

### 4 masses 

In [15]:
# Visualize trajectories: close any open figures and create the figure/axes
# that the animation draws on.
plt.close('all')
fig_animate3 = plt.figure(1, figsize=(5, 5))
ax3 = fig_animate3.add_subplot(1, 1, 1)

# Marker artists, filled by init(): `dots` holds the ground-truth markers and
# `dots1` the predicted ones, one entry per node.
dots = []
dots1 = []

# Number of nodes = size of axis 1; animate() indexes the trajectories as
# [frame, node, coordinate].
num_nodes = true_trajectory_np.shape[1]
    
def init():
    """Create the (initially empty) marker artists for the animation.

    Adds one red "truth" marker and one black "prediction" marker per node to
    `ax3` and stores them in the module-level lists `dots` and `dots1`. Only
    the first pair is labelled, so the legend shows one entry per series.

    The animation may invoke its init function more than once (for example
    when it is both saved and shown). The artists are therefore created on the
    first call only; later calls return the existing ones instead of adding
    duplicate artists and duplicate legend entries.

    Returns:
        The tuple (dots, dots1).
    """
    if dots or dots1:
        return dots,dots1

    marker_style = dict(linestyle='none', marker='o', markersize=5)
    for i in range(num_nodes):
        # Pass a label for the first node only; the other artists keep
        # Matplotlib's default label and stay out of the legend.
        truth_label = {"label": "Truth"} if i == 0 else {}
        prediction_label = {"label": "Prediction"} if i == 0 else {}
        dots.append(ax3.plot([], [], color="r", **dict(marker_style, **truth_label)))
        dots1.append(ax3.plot([], [], color="k", **dict(marker_style, **prediction_label)))

    return dots,dots1
    
# Fixed view window for the animation: only positions within [-10, 10] on both
# axes are visible.
ax3.set_xlim(-10, 10)
ax3.set_ylim(-10, 10)


def animate(z):
    """Move every marker to its position at frame `z`.

    Args:
        z: Frame index; used as the first index into `true_trajectory_np` and
            `predicted_trajectory_np`.

    Returns:
        The tuple (dots, dots1, legend).
    """
    for i in range(num_nodes):
        # Line2D.set_data expects sequences; passing bare scalars is deprecated
        # and rejected by newer Matplotlib, so each coordinate is wrapped in a
        # one-element list.
        dots[i][0].set_data([true_trajectory_np[z,i,0]], [true_trajectory_np[z,i,1]])
        dots1[i][0].set_data([predicted_trajectory_np[z,i,0]], [predicted_trajectory_np[z,i,1]])
    legend = ax3.legend()
    return dots, dots1, legend



# Title and axis labels are set before the animation is rendered so that they
# also appear in the saved GIF, not only in the interactive figure.
ax3.set_title("Trajectory for generalisation")
ax3.set_xlabel("x")
ax3.set_ylabel("y")

# One frame per simulated time step, displayed at the simulation step size.
anim = animation.FuncAnimation(fig_animate3, animate,init_func = init, interval = step_size * 1000, frames=num_time_steps, blit=False, repeat=True)
# Save animation. The GIF is written to the same location that is checked for
# an existing file (below `path_animations`), not to a path relative to the
# working directory.
rollout_dir = os.path.join(path_animations, desc, "FullRollout")
gif_file = os.path.join(rollout_dir, "trajectory_masses.gif")
if os.path.exists(gif_file):
    print("The file: "+ "trajectory_masses.gif" + " already exists. Delete it before saving a new animation!")
else:
    # os.makedirs creates both the run folder and "FullRollout" as needed;
    # previously "FullRollout" was only created when the run folder itself was
    # missing, so saving failed if the run folder already existed.
    if not os.path.exists(rollout_dir):
        os.makedirs(rollout_dir)

    anim.save(gif_file, writer='imagemagick', fps=20)

plt.show()

<IPython.core.display.Javascript object>