In [None]:
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import tensorflow as tf

In [None]:
def plot_series(time, series, format="-", start=0, end=None):
    """Draw `series` against `time` on the current matplotlib figure.

    Args:
        time: sequence of x values.
        series: sequence of y values, indexed the same way as `time`.
        format: matplotlib format string passed to `plt.plot`.
        start: first index to draw (inclusive).
        end: last index to draw (exclusive); None means through the end.
    """
    span = slice(start, end)
    plt.plot(time[span], series[span], format)
    plt.grid(True)
    plt.ylabel("Value")
    plt.xlabel("Time")

In [None]:
# Fetch the Sunspots CSV via Keras' download helper and show where the local
# copy was stored. The URL must not carry surrounding whitespace.
path = tf.keras.utils.get_file(
    'sunspots.csv',
    'https://storage.googleapis.com/laurencemoroney-blog.appspot.com/Sunspots.csv')
print(path)

In [None]:
# Read the CSV with 'Date' as the index and let pandas try to parse it as dates.
df = pd.read_csv(path, parse_dates=True, index_col='Date')
# Discard every column whose label contains "unnamed" (case-insensitive).
df = df.drop(columns=df.columns[df.columns.str.contains('unnamed', case=False)])
df.columns = ['Sunspots']   # rename the single remaining column
df.plot(figsize=(10, 6))

In [None]:
# NumPy copies of the data: the dataframe index as the time axis and the
# sunspot column as floats.
time = np.array(df.index)
series = np.array(df['Sunspots'], dtype=float)

plt.figure(figsize=(10, 6))
plot_series(time, series)

In [None]:
# Cut point: entries before this index are used for training, entries from
# this index onward for validation.
split_time = 3000

time_train, time_valid = time[:split_time], time[split_time:]
x_train, x_valid = series[:split_time], series[split_time:]

In [None]:
# Initial hyperparameters for the windowed dataset.
shuffle_buffer_size = 1000
batch_size = 32      # windows per batch
window_size = 30     # time steps per input window

In [None]:
from tensorflow.keras.preprocessing.sequence import TimeseriesGenerator

# The training series serves as both the input data and the targets.
generator = TimeseriesGenerator(
    data=x_train,
    targets=x_train,
    length=window_size,
    sampling_rate=1,
    shuffle=True,
    batch_size=batch_size,
)

In [None]:
def model_forecast(model, series, window_size, batch_size=32):
    """Run `model` over every sliding window of `series`.

    Args:
        model: object exposing `predict`; it is called once on the windowed dataset.
        series: array-like that is sliced along its first axis into single steps.
        window_size: number of consecutive steps in each window.
        batch_size: number of windows per prediction batch. Defaults to 32,
            the value that used to be hard-coded here.

    Returns:
        Whatever `model.predict` returns for the dataset of windows. Windows
        advance one step at a time and incomplete trailing windows are dropped.
    """
    ds = tf.data.Dataset.from_tensor_slices(series)
    ds = ds.window(window_size, shift=1, drop_remainder=True)
    # Each window is itself a dataset; batching it by window_size collapses it
    # into a single tensor.
    ds = ds.flat_map(lambda w: w.batch(window_size))
    ds = ds.batch(batch_size).prefetch(1)
    return model.predict(ds)

In [None]:
# Drop any existing Keras state, then seed the NumPy and TensorFlow RNGs with
# the same fixed value.
tf.keras.backend.clear_session()
np.random.seed(51)
tf.random.set_seed(51)

In [None]:
# Hyperparameters for the Conv1D + LSTM model.
n_features = 1       # values per time step
batch_size = 256     # windows per batch
window_size = 64     # time steps per input window

In [None]:
# Give the training series an explicit feature axis: (steps, n_features).
# The model below declares its input as [None, 1].
x_train = np.reshape(x_train, (len(x_train), n_features))

In [None]:
# Rebuild the generator with the current window_size and batch_size; the
# training series is again both the input data and the targets.
generator = TimeseriesGenerator(
    data=x_train,
    targets=x_train,
    length=window_size,
    sampling_rate=1,
    shuffle=True,
    batch_size=batch_size,
)

In [None]:
# Conv1D front end -> two stacked LSTMs -> small dense head, added layer by layer.
model = tf.keras.models.Sequential()
model.add(tf.keras.layers.Conv1D(
    filters=32, kernel_size=5, strides=1,
    padding="causal", activation="relu",
    input_shape=[None, 1]))  # any sequence length, one feature per step
# Both LSTMs return the full sequence, so the layers after them are applied
# at every time step.
model.add(tf.keras.layers.LSTM(64, return_sequences=True))
model.add(tf.keras.layers.LSTM(64, return_sequences=True))
model.add(tf.keras.layers.Dense(30, activation="relu"))
model.add(tf.keras.layers.Dense(10, activation="relu"))
model.add(tf.keras.layers.Dense(1))
# Multiply the raw output by 400 (presumably to match the scale of the data -- confirm).
model.add(tf.keras.layers.Lambda(lambda x: x * 400))

In [None]:
# Print the layer-by-layer summary of the model defined above.
model.summary()

In [None]:
# Learning-rate sweep: start at 1e-8 and grow tenfold every 20 epochs.
lr_schedule = tf.keras.callbacks.LearningRateScheduler(
    schedule=lambda epoch: 1e-8 * 10 ** (epoch / 20)
)

In [None]:
# SGD with momentum, starting from a very small learning rate.
# `learning_rate` is the supported keyword; `lr` is a deprecated alias.
optimizer = tf.keras.optimizers.SGD(learning_rate=1e-8, momentum=0.9)

In [None]:
# Train with Huber loss; mean absolute error is tracked as an extra metric.
model.compile(
    optimizer=optimizer,
    loss=tf.keras.losses.Huber(),
    metrics=["mae"],
)

In [None]:
# Train for 100 epochs with the learning-rate scheduler attached as a callback.
history = model.fit(x=generator, callbacks=[lr_schedule], epochs=100)

In [None]:
# Loss recorded per epoch against the learning rate recorded for that epoch,
# with a log-scaled x axis.
plt.semilogx(history.history["lr"], history.history["loss"])
# Fix the view to x in [1e-8, 1e-4] and y in [0, 60].
plt.axis([1e-8, 1e-4, 0, 60])

In [None]:
# Reset Keras state before building the next model, then re-seed the NumPy
# and TensorFlow RNGs with the same fixed value.
tf.keras.backend.clear_session()
np.random.seed(51)
tf.random.set_seed(51)

In [None]:
# Window and batch sizes for the final training run.
batch_size = 256     # windows per batch
window_size = 64     # time steps per input window

In [None]:
# Fresh generator for the final training run; the training series is both the
# input data and the targets.
generator = TimeseriesGenerator(
    data=x_train,
    targets=x_train,
    length=window_size,
    sampling_rate=1,
    shuffle=True,
    batch_size=batch_size,
)

In [None]:
# Ensure the training series has an explicit feature axis: (steps, n_features).
# Applying this to an array that already has that shape leaves it unchanged.
x_train = np.reshape(x_train, (len(x_train), n_features))

In [None]:
# Same layout as the sweep model but 60 units wide: Conv1D front end, two
# stacked LSTMs, small dense head.
model = tf.keras.models.Sequential()
model.add(tf.keras.layers.Conv1D(
    filters=60, kernel_size=5, strides=1,
    padding="causal", activation="relu",
    input_shape=[None, 1]))  # any sequence length, one feature per step
# Both LSTMs return the full sequence, so the layers after them are applied
# at every time step.
model.add(tf.keras.layers.LSTM(60, return_sequences=True))
model.add(tf.keras.layers.LSTM(60, return_sequences=True))
model.add(tf.keras.layers.Dense(30, activation="relu"))
model.add(tf.keras.layers.Dense(10, activation="relu"))
model.add(tf.keras.layers.Dense(1))
# Multiply the raw output by 400 (presumably to match the scale of the data -- confirm).
model.add(tf.keras.layers.Lambda(lambda x: x * 400))

In [None]:
# Print the layer-by-layer summary of the final model.
model.summary()

In [None]:
# Learning rate chosen from the loss-vs-learning-rate plot of the first model.
# `learning_rate` is the supported keyword; `lr` is a deprecated alias.
optimizer = tf.keras.optimizers.SGD(learning_rate=1e-5, momentum=0.9)

In [None]:
# Train with Huber loss; mean absolute error is tracked as an extra metric.
model.compile(
    optimizer=optimizer,
    loss=tf.keras.losses.Huber(),
    metrics=["mae"],
)

In [None]:
# Full training run: 500 epochs at the fixed learning rate.
history = model.fit(x=generator, epochs=500)

In [None]:
# The model takes (batch, steps, features) input, so the full series needs an
# explicit feature axis: (steps,) -> (steps, n_features).
series_2d = np.array(df['Sunspots'], dtype=float)
print(series_2d.shape)
series_2d = np.reshape(series_2d, (len(series_2d), n_features))
print(series_2d.shape)

In [None]:
# Forecast the validation period. Each validation step is predicted from the
# `window_size` values that precede it, so the first window starts at
# split_time - window_size and the last one ends just before the final value.
first_window = split_time - window_size
last_window = len(series_2d) - window_size
validation_windows = np.stack(
    [series_2d[start:start + window_size] for start in range(first_window, last_window)]
)

# One batched predict call instead of one call per window. The model emits a
# value at every time step of a window; keep the last step (the only one that
# has seen the whole window) of the single output feature, giving a 1-D array
# aligned with x_valid.
rnn_forecast = model.predict(validation_windows)[:, -1, 0]

plt.figure(figsize=(10, 6))

plot_series(time_valid, x_valid)
plot_series(time_valid, rnn_forecast)

In [None]:
# series_2d already has shape (steps, n_features). Adding another axis would
# feed the model 4-D batches instead of the 3-D input it was built for, so
# pass the array through unchanged.
rnn_forecast_x = model_forecast(model, series_2d, window_size)

In [None]:
# Keep the windows from index split_time - window_size onward and drop the
# very last window. From each remaining prediction take the final time step
# of feature 0.
# NOTE(review): this assumes window i forecasts the value at i + window_size,
# so the result lines up with the validation split -- confirm.
rnn_forecast_x = rnn_forecast_x[split_time - window_size:-1, -1, 0]

In [None]:
# Actual validation values with the forecast drawn on top of them.
# NOTE(review): this plots `rnn_forecast`, not the `rnn_forecast_x` computed
# by model_forecast in the preceding cells -- confirm which one is intended.
plt.figure(figsize=(10, 6))
plot_series(time_valid, x_valid)
plot_series(time_valid, rnn_forecast)

In [None]:
# Flatten the forecast first: a trailing singleton axis would broadcast
# against the 1-D x_valid and yield one value per row instead of a single MAE.
tf.keras.metrics.mean_absolute_error(x_valid, np.ravel(rnn_forecast)).numpy()

In [None]:
import matplotlib.image  as mpimg
import matplotlib.pyplot as plt

#-----------------------------------------------------------
# Retrieve the per-epoch training loss recorded by model.fit
#-----------------------------------------------------------
loss = history.history['loss']

epochs = range(len(loss))  # one entry per recorded epoch

#------------------------------------------------
# Plot training loss per epoch
#------------------------------------------------
plt.plot(epochs, loss, 'r')
plt.title('Training loss')
plt.xlabel("Epochs")
plt.ylabel("Loss")
plt.legend(["Loss"])

plt.figure()

# Zoom in on the later epochs. The x range is derived from the recorded loss
# so it stays in step with however many epochs were actually run.
zoom_start = 200
zoomed_loss = loss[zoom_start:]
zoomed_epochs = range(zoom_start, len(loss))

#------------------------------------------------
# Plot training loss per epoch (zoomed)
#------------------------------------------------
plt.plot(zoomed_epochs, zoomed_loss, 'r')
plt.title('Training loss')
plt.xlabel("Epochs")
plt.ylabel("Loss")
plt.legend(["Loss"])

In [None]:
#print(rnn_forecast)