In [None]:
# Imports
import pandas as pd
import numpy as np
import matplotlib
import matplotlib.pyplot as plt
import plotly.express as px
import tensorflow as tf

In [None]:
# Data
# Read the source CSV into a DataFrame and preview its first rows.
# NOTE(review): this is an absolute, machine-specific path; consider making
# the data directory configurable before sharing the notebook.
csv_path = 'C:/Users/mnauf/Harits/Coding/covid_19_indonesia_time_series_all.csv'
data = pd.read_csv(csv_path)
data.head()

In [None]:
# Keep only the rows whose Location is 'DKI Jakarta', then build one
# two-column frame per target series (date + daily count).
is_jakarta = data['Location'] == 'DKI Jakarta'
df = data.loc[is_jakarta]

cases_columns = ['Date', 'New Cases']
deaths_columns = ['Date', 'New Deaths']
df1 = df[cases_columns]
df2 = df[deaths_columns]

In [None]:
# Preview the first five rows of the Date / New Cases frame
df1.head(n=5)

In [None]:
# (rows, columns) of the New Cases frame.
# `shape` is a tuple attribute, not a method: calling it raises TypeError.
df1.shape

In [None]:
# Preview the first five rows of the Date / New Deaths frame
df2.head(n=5)

In [None]:
# (rows, columns) of the New Deaths frame.
# `shape` is a tuple attribute, not a method: calling it raises TypeError.
df2.shape

In [None]:
# Persist each Jakarta frame to its own CSV in the working directory.
# The DataFrame index is written as the first column (to_csv default).
for frame, out_name in (
    (df1, 'new_cases_jakarta.csv'),
    (df2, 'new_deaths_jakarta.csv'),
):
    frame.to_csv(out_name)

In [None]:
# Reload the saved New Cases CSV (first column is the index) and expose
# the dates and the daily counts both as Python lists and as NumPy arrays.
data1 = pd.read_csv('new_cases_jakarta.csv', header=0, index_col=0)

list_date1 = data1['Date'].tolist()
date1 = np.array(list_date1)

list_series1 = data1['New Cases'].tolist()
series1 = np.array(list_series1)

In [None]:
# plot column
def plot_series(time, series, format="-", start=0, end=None):
    """Draw one line of `series` against `time` on the current matplotlib axes.

    This helper is called by several cells but was never defined in the
    notebook, so a fresh kernel raised NameError on first use.

    Args:
        time: sequence of x values (sliceable).
        series: sequence of y values, same length as `time`.
        format: matplotlib format string for the line.
        start: first index to plot.
        end: index to stop at (exclusive); None plots to the end.
    """
    plt.plot(time[start:end], series[start:end], format)
    plt.xlabel("Time")
    plt.ylabel("Value")
    plt.grid(True)


plt.figure(figsize=(10, 6))
plot_series(date1, series1)
plt.title('New Cases Jakarta')
plt.show()

In [None]:
# load dataset for New Deaths
# The deaths CSV was written from df2, whose columns are 'Date' and
# 'New Deaths'; reading 'New Cases' from it raises KeyError.
data2 = pd.read_csv('new_deaths_jakarta.csv', header=0, index_col=0)
list_date2 = data2['Date'].tolist()
list_series2 = data2['New Deaths'].tolist()
series2 = np.array(list_series2)
date2 = np.array(list_date2)

In [None]:
# Draw the Jakarta New Deaths series on its own 10x6 figure
plt.figure(figsize=(10, 6))
plot_series(date2, series2)
deaths_axes = plt.gca()
deaths_axes.set_title('New Deaths Jakarta')
plt.show()

In [None]:
#Split data for training and validation
# `series` and `time` were referenced here but never defined anywhere in the
# notebook. Model the New Cases series (swap in `series2` to forecast New
# Deaths instead) and cast to float32 so the Keras layers receive float input.
series = series1.astype("float32")
# Integer time steps 0..N-1, one per observation
time = np.arange(len(series))

# Keep the original 2500-step split when the series is long enough; otherwise
# fall back to an 80/20 split so the validation set is not empty.
DEFAULT_SPLIT_TIME = 2500
if len(series) > DEFAULT_SPLIT_TIME:
    split_time = DEFAULT_SPLIT_TIME
else:
    split_time = int(len(series) * 0.8)

time_train = time[:split_time]
x_train = series[:split_time]
time_valid = time[split_time:]
x_valid = series[split_time:]

window_size = 30
batch_size = 32
shuffle_buffer_size = 1000

In [None]:
# Helper that turns a 1-D series into a shuffled, batched window dataset
def windowed_dataset(series, window_size, batch_size, shuffle_buffer):
    """Build a tf.data pipeline of (input, target) window pairs.

    A trailing axis is added to `series`, which is then cut into overlapping
    windows of `window_size + 1` steps (shift 1, incomplete windows dropped).
    The windows are shuffled with a buffer of `shuffle_buffer` elements, and
    each is split into all-but-last steps (input) and all-but-first steps
    (target). Pairs are batched by `batch_size` and prefetched one batch ahead.

    Returns:
        The resulting tf.data.Dataset.
    """
    span = window_size + 1
    values = tf.expand_dims(series, axis=-1)
    windows = (
        tf.data.Dataset.from_tensor_slices(values)
        .window(span, shift=1, drop_remainder=True)
        .flat_map(lambda win: win.batch(span))
        .shuffle(shuffle_buffer)
        .map(lambda win: (win[:-1], win[1:]))
    )
    batched = windows.batch(batch_size)
    return batched.prefetch(1)

In [None]:
# Helper that runs a model over every sliding window of a series
def model_forecast(model, series, window_size, batch_size=32):
    """Predict on all sliding windows of `series`.

    `series` is cut into overlapping windows of `window_size` steps
    (shift 1, incomplete windows dropped), batched, and passed to
    `model.predict`.

    Args:
        model: object exposing `predict(dataset)`.
        series: array-like accepted by `tf.data.Dataset.from_tensor_slices`.
        window_size: number of consecutive steps per window.
        batch_size: windows per prediction batch; defaults to 32, the
            value that was previously hard-coded.

    Returns:
        Whatever `model.predict` returns for the windowed dataset.
    """
    ds = tf.data.Dataset.from_tensor_slices(series)
    ds = ds.window(window_size, shift=1, drop_remainder=True)
    ds = ds.flat_map(lambda w: w.batch(window_size))
    ds = ds.batch(batch_size).prefetch(1)
    return model.predict(ds)

In [None]:
#Find the best learning rate
# Reset Keras state and fix the seeds so the sweep is repeatable.
tf.keras.backend.clear_session()
tf.random.set_seed(51)
np.random.seed(51)
# These override the window/batch sizes set in the split cell.
window_size = 64
batch_size = 256
train_set = windowed_dataset(x_train, window_size, batch_size, shuffle_buffer_size)
print(train_set)
print(x_train.shape)

model = tf.keras.models.Sequential([
  tf.keras.layers.Conv1D(filters=32, kernel_size=5,
                      strides=1, padding="causal",
                      activation="relu",
                      input_shape=[None, 1]),
  tf.keras.layers.LSTM(64, return_sequences=True),
  tf.keras.layers.LSTM(64, return_sequences=True),
  tf.keras.layers.Dense(30, activation="relu"),
  tf.keras.layers.Dense(10, activation="relu"),
  tf.keras.layers.Dense(1),
  # Multiplies the network output by 400
  # (presumably to match the scale of the series; TODO confirm).
  tf.keras.layers.Lambda(lambda x: x * 400)
])

# Raise the learning rate tenfold every 20 epochs, starting from 1e-8.
lr_schedule = tf.keras.callbacks.LearningRateScheduler(
    lambda epoch: 1e-8 * 10**(epoch / 20))
# `lr` is a deprecated alias that current Keras rejects; use `learning_rate`.
optimizer = tf.keras.optimizers.SGD(learning_rate=1e-8, momentum=0.9)
model.compile(loss=tf.keras.losses.Huber(),
              optimizer=optimizer,
              metrics=["mae"])
history = model.fit(train_set, epochs=100, callbacks=[lr_schedule])

In [None]:
#Plot graph to see each learning rate loss
# The scheduler callback logs the rate under "lr" in older Keras and under
# "learning_rate" in newer releases; accept either key.
lr_key = "lr" if "lr" in history.history else "learning_rate"
plt.semilogx(history.history[lr_key], history.history["loss"])
plt.axis([1e-8, 1e-4, 0, 60])
plt.xlabel("Learning rate")
plt.ylabel("Loss")
plt.show()

In [None]:
#Use the best learning rate to train the model
# Reset Keras state and fix the seeds so training is repeatable.
tf.keras.backend.clear_session()
tf.random.set_seed(51)
np.random.seed(51)
# NOTE(review): training uses 60-step windows here, while the forecast cell
# slices with the global `window_size`; confirm the two are meant to differ.
train_set = windowed_dataset(x_train, window_size=60, batch_size=100, shuffle_buffer=shuffle_buffer_size)
model = tf.keras.models.Sequential([
  tf.keras.layers.Conv1D(filters=60, kernel_size=5,
                      strides=1, padding="causal",
                      activation="relu",
                      input_shape=[None, 1]),
  tf.keras.layers.LSTM(60, return_sequences=True),
  tf.keras.layers.LSTM(60, return_sequences=True),
  tf.keras.layers.Dense(30, activation="relu"),
  tf.keras.layers.Dense(10, activation="relu"),
  tf.keras.layers.Dense(1),
  # Multiplies the network output by 400
  # (presumably to match the scale of the series; TODO confirm).
  tf.keras.layers.Lambda(lambda x: x * 400)
])


# `lr` is a deprecated alias that current Keras rejects; use `learning_rate`.
optimizer = tf.keras.optimizers.SGD(learning_rate=1e-5, momentum=0.9)
model.compile(loss=tf.keras.losses.Huber(),
              optimizer=optimizer,
              metrics=["mae"])
history = model.fit(train_set,epochs=150)

In [None]:
# Predict on every sliding window of the full series, then keep only the
# windows that line up with the validation period. From each kept window,
# take the last time step and the first output channel.
all_window_forecasts = model_forecast(model, series[..., np.newaxis], window_size)
first_valid_window = split_time - window_size
rnn_forecast = all_window_forecasts[first_valid_window:-1, -1, 0]

In [None]:
#Plot forecasted data to the validation dataset
plt.figure(figsize=(10, 6))
plot_series(time_valid, x_valid)
plot_series(time_valid, rnn_forecast)
# Label the two curves so they can be told apart. Labels follow draw order,
# assuming each plot_series call draws exactly one line.
plt.legend(["Actual", "Forecast"])
plt.title("Validation data vs. forecast")
plt.show()

In [None]:
# Mean absolute error between the validation values and the forecast,
# converted from a tensor to a NumPy value for display.
validation_mae = tf.keras.metrics.mean_absolute_error(x_valid, rnn_forecast)
validation_mae.numpy()