In [1]:
# QUESTION
#
# For this task you will need to train a neural network
# to predict sunspot activity using the Sunspots.csv dataset.
# Your neural network must have an MAE
# of 0.12 or less on the normalized dataset for top marks.
# Code for normalizing the data is provided and should not be changed.
# At the bottom of this file, we provide some testing
# code should you want to check your model.

# Note: Do not use lambda layers in your model, they are not supported
# on the grading infrastructure.
# <번역> 
# 이 작업을 위해서는 신경망을 훈련시켜야합니다.
# Sunspots.csv 데이터 세트를 사용하여 흑점 활동을 예측합니다.
# 상위 마크에 대한 정규화 된 데이터 세트에서 0.12 이하의 MAE가 있어야합니다.
# 데이터 정규화를위한 코드가 제공되며 변경해서는 안됩니다.
# 당신의 모델을 체크하려면, 이 파일의 맨 아래에 몇 가지 테스팅 코드가 있습니다.
# 참고 : 모델에서 람다 레이어를 사용하지 마십시오. 채점 인프라에서 지원되지 않습니다.
 


import csv
import tensorflow as tf
import numpy as np
import urllib
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Conv1D, LSTM 
from tensorflow.keras.optimizers import SGD, RMSprop
from tensorflow.keras.losses import Huber
from tensorflow.keras.callbacks import ModelCheckpoint


# DO NOT CHANGE THIS CODE
def windowed_dataset(series, window_size, batch_size, shuffle_buffer):
    """Turn a 1-D series into shuffled, batched (input, target) window pairs.

    A trailing axis is added to `series`, which is then cut into sliding
    windows of `window_size + 1` consecutive elements (shift of 1, incomplete
    trailing windows dropped). Each window is split into an input made of all
    elements but the last and a target made of all elements but the first.

    Args:
        series: The values to window.
        window_size: Number of elements in each input/target sequence.
        batch_size: Number of window pairs per emitted batch.
        shuffle_buffer: Buffer size handed to `Dataset.shuffle`.

    Returns:
        A `tf.data.Dataset` of batched `(input, target)` pairs with a
        prefetch of 1.
    """
    span = window_size + 1
    expanded = tf.expand_dims(series, axis=-1)
    pairs = (
        tf.data.Dataset.from_tensor_slices(expanded)
        .window(span, shift=1, drop_remainder=True)
        # Each window is itself a dataset; batching it by its full length
        # collapses it into a single tensor.
        .flat_map(lambda win: win.batch(span))
        .shuffle(shuffle_buffer)
        .map(lambda win: (win[:-1], win[1:]))
    )
    return pairs.batch(batch_size).prefetch(1)


def solution_model():
    """Download the Sunspots data, train a Conv1D + LSTM forecaster and return it.

    Steps performed:
      1. Download Sunspots.csv and save it as 'sunspots.csv' in the working
         directory.
      2. Read the sunspot values (third CSV column) and the time steps (first
         CSV column), skipping the header row.
      3. Normalize the series with the provided normalization code.
      4. Split the series at time step 3000 into training and validation parts
         and build windowed datasets from both.
      5. Train for 100 epochs with Huber loss and SGD, checkpointing the
         weights whenever `val_mae` improves.
      6. Reload the best checkpointed weights into the model.

    Returns:
        The trained Keras model carrying the weights of the best checkpoint
        as judged by `val_mae`.
    """
    # `import urllib` alone does not guarantee that the `request` submodule is
    # loaded; import it explicitly so `urllib.request.urlretrieve` always resolves.
    import urllib.request

    url = 'https://storage.googleapis.com/download.tensorflow.org/data/Sunspots.csv'
    urllib.request.urlretrieve(url, 'sunspots.csv')

    time_step = []
    sunspots = []

    with open('sunspots.csv') as csvfile:
        reader = csv.reader(csvfile, delimiter=',')
        next(reader)  # skip the header row
        for row in reader:
            sunspots.append(float(row[2]))   # YOUR CODE HERE
            time_step.append(int(row[0]))  # YOUR CODE HERE

    series = np.array(sunspots)  # YOUR CODE HERE

    # DO NOT CHANGE THIS CODE
    # This is the normalization function
    min = np.min(series)
    max = np.max(series)
    series -= min
    series /= max
    time = np.array(time_step)

    # The data should be split into training and validation sets at time step 3000
    # DO NOT CHANGE THIS CODE
    split_time = 3000

    time_train = time[:split_time]  # YOUR CODE HERE
    x_train = series[:split_time]  # YOUR CODE HERE
    time_valid = time[split_time:]  # YOUR CODE HERE
    x_valid = series[split_time:]  # YOUR CODE HERE

    # DO NOT CHANGE THIS CODE
    window_size = 30
    batch_size = 32
    shuffle_buffer_size = 1000

    train_set = windowed_dataset(x_train, window_size=window_size, batch_size=batch_size, shuffle_buffer=shuffle_buffer_size)
    valid_set = windowed_dataset(x_valid, window_size=window_size, batch_size=batch_size, shuffle_buffer=shuffle_buffer_size)

    # YOUR CODE HERE. Whatever your first layer is, the input shape will be [None,1] when using the Windowed_dataset above, depending on the layer type chosen
    model = Sequential([
        # Causal padding keeps the sequence length unchanged and prevents the
        # convolution from looking at later time steps.
        Conv1D(60, kernel_size=5, padding='causal', activation='relu', input_shape=[None, 1]),
        # Both LSTMs return full sequences, so the model emits one value per
        # time step, matching the sequence targets from windowed_dataset.
        LSTM(60, return_sequences=True),
        LSTM(60, return_sequences=True),
        Dense(30, activation='relu'),
        Dense(10, activation='relu'),
        Dense(1),
    ])

    # YOUR CODE HERE TO COMPILE AND TRAIN THE MODEL
    # `learning_rate` is the supported argument name; the `lr` alias is
    # deprecated and rejected by newer Keras releases.
    opt = SGD(learning_rate=1e-5, momentum=0.9)
    model.compile(loss=Huber(), optimizer=opt, metrics=['mae'])

    # Keep only the weights of the epoch with the best validation MAE so the
    # returned model is not simply whatever the last epoch produced.
    checkpoint_path = 'sunset_checkpoint1.ckpt'
    checkpoint = ModelCheckpoint(filepath=checkpoint_path, save_weights_only=True, save_best_only=True,
                                 monitor='val_mae', verbose=1)
    model.fit(train_set, validation_data=valid_set, epochs=100, callbacks=[checkpoint])
    model.load_weights(checkpoint_path)
    return model


# Note that you'll need to save your model as a .h5 like this.
# When you press the Submit and Test button, this .h5 model will be
# sent to the testing infrastructure for scoring.

# You must use the Submit and Test button to submit your model
# at least once in each category before you finally submit your exam.

# Train the model and save it to an HDF5 file. The name `model` stays bound at
# module level after this runs; the forecasting check further down in this
# file passes it to model_forecast.
if __name__ == '__main__':
    model = solution_model()
    model.save("cat5_sunspots(typeB).h5")



# THIS CODE IS USED IN THE TESTER FOR FORECASTING. IF YOU WANT TO TEST YOUR MODEL
# BEFORE UPLOADING YOU CAN DO IT WITH THIS
#def model_forecast(model, series, window_size):
#    ds = tf.data.Dataset.from_tensor_slices(series)
#    ds = ds.window(window_size, shift=1, drop_remainder=True)
#    ds = ds.flat_map(lambda w: w.batch(window_size))
#    ds = ds.batch(32).prefetch(1)
#    forecast = model.predict(ds)
#    return forecast


#window_size = # YOUR CODE HERE
#rnn_forecast = model_forecast(model, series[..., np.newaxis], window_size)
#rnn_forecast = rnn_forecast[split_time - window_size:-1, -1, 0]

#result = tf.keras.metrics.mean_absolute_error(x_valid, rnn_forecast).numpy()

## To get the maximum score, your model must have an MAE OF .12 or less.
## When you Submit and Test your model, the grading infrastructure
## converts the MAE of your model to a score from 0 to 5 as follows:

#test_val = 100 * result
#score = math.ceil(17 - test_val)
#if score > 5:
#    score = 5

#print(score)

Epoch 1/100
     92/Unknown - 1s 14ms/step - loss: 0.0320 - mae: 0.1923
Epoch 00001: val_mae improved from inf to 0.16108, saving model to sunset_checkpoint1.ckpt
Epoch 2/100
Epoch 00002: val_mae improved from 0.16108 to 0.15523, saving model to sunset_checkpoint1.ckpt
Epoch 3/100
Epoch 00003: val_mae improved from 0.15523 to 0.15014, saving model to sunset_checkpoint1.ckpt
Epoch 4/100
Epoch 00004: val_mae improved from 0.15014 to 0.14562, saving model to sunset_checkpoint1.ckpt
Epoch 5/100
Epoch 00005: val_mae improved from 0.14562 to 0.14137, saving model to sunset_checkpoint1.ckpt
Epoch 6/100
Epoch 00006: val_mae improved from 0.14137 to 0.13755, saving model to sunset_checkpoint1.ckpt
Epoch 7/100
Epoch 00007: val_mae improved from 0.13755 to 0.13417, saving model to sunset_checkpoint1.ckpt
Epoch 8/100
Epoch 00008: val_mae improved from 0.13417 to 0.13110, saving model to sunset_checkpoint1.ckpt
Epoch 9/100
Epoch 00009: val_mae improved from 0.13110 to 0.12844, saving model to sunse

Epoch 28/100
Epoch 00028: val_mae improved from 0.10697 to 0.10660, saving model to sunset_checkpoint1.ckpt
Epoch 29/100
Epoch 00029: val_mae improved from 0.10660 to 0.10630, saving model to sunset_checkpoint1.ckpt
Epoch 30/100
Epoch 00030: val_mae improved from 0.10630 to 0.10605, saving model to sunset_checkpoint1.ckpt
Epoch 31/100
Epoch 00031: val_mae improved from 0.10605 to 0.10584, saving model to sunset_checkpoint1.ckpt
Epoch 32/100
Epoch 00032: val_mae improved from 0.10584 to 0.10568, saving model to sunset_checkpoint1.ckpt
Epoch 33/100
Epoch 00033: val_mae improved from 0.10568 to 0.10555, saving model to sunset_checkpoint1.ckpt
Epoch 34/100
Epoch 00034: val_mae improved from 0.10555 to 0.10544, saving model to sunset_checkpoint1.ckpt
Epoch 35/100
Epoch 00035: val_mae improved from 0.10544 to 0.10536, saving model to sunset_checkpoint1.ckpt
Epoch 36/100
Epoch 00036: val_mae improved from 0.10536 to 0.10531, saving model to sunset_checkpoint1.ckpt
Epoch 37/100
Epoch 00037: va

Epoch 58/100
Epoch 00058: val_mae did not improve from 0.10528
Epoch 59/100
Epoch 00059: val_mae did not improve from 0.10528
Epoch 60/100
Epoch 00060: val_mae did not improve from 0.10528
Epoch 61/100
Epoch 00061: val_mae did not improve from 0.10528
Epoch 62/100
Epoch 00062: val_mae did not improve from 0.10528
Epoch 63/100
Epoch 00063: val_mae did not improve from 0.10528
Epoch 64/100
Epoch 00064: val_mae did not improve from 0.10528
Epoch 65/100
Epoch 00065: val_mae did not improve from 0.10528
Epoch 66/100
Epoch 00066: val_mae did not improve from 0.10528
Epoch 67/100
Epoch 00067: val_mae did not improve from 0.10528
Epoch 68/100
Epoch 00068: val_mae did not improve from 0.10528
Epoch 69/100
Epoch 00069: val_mae did not improve from 0.10528
Epoch 70/100
Epoch 00070: val_mae did not improve from 0.10528
Epoch 71/100
Epoch 00071: val_mae did not improve from 0.10528
Epoch 72/100
Epoch 00072: val_mae did not improve from 0.10528
Epoch 73/100
Epoch 00073: val_mae did not improve from 

Epoch 90/100
Epoch 00090: val_mae did not improve from 0.10528
Epoch 91/100
Epoch 00091: val_mae did not improve from 0.10528
Epoch 92/100
Epoch 00092: val_mae did not improve from 0.10528
Epoch 93/100
Epoch 00093: val_mae did not improve from 0.10528
Epoch 94/100
Epoch 00094: val_mae did not improve from 0.10528
Epoch 95/100
Epoch 00095: val_mae did not improve from 0.10528
Epoch 96/100
Epoch 00096: val_mae did not improve from 0.10528
Epoch 97/100
Epoch 00097: val_mae did not improve from 0.10528
Epoch 98/100
Epoch 00098: val_mae did not improve from 0.10528
Epoch 99/100
Epoch 00099: val_mae did not improve from 0.10528
Epoch 100/100
Epoch 00100: val_mae did not improve from 0.10528


In [3]:
# <Reference code: checks the model's performance (scored grade 5, OK)> #
# Never include this part in the submitted answer #
# THIS CODE IS USED IN THE TESTER FOR FORECASTING. IF YOU WANT TO TEST YOUR MODEL
# BEFORE UPLOADING YOU CAN DO IT WITH THIS
import math
# `import urllib` alone does not guarantee that the `request` submodule is
# loaded; import it explicitly so `urllib.request.urlretrieve` always resolves.
import urllib.request

url = 'https://storage.googleapis.com/download.tensorflow.org/data/Sunspots.csv'
urllib.request.urlretrieve(url, 'sunspots.csv')

time_step = []
sunspots = []

# Same parsing as in solution_model: third column is the sunspot value,
# first column is the time step; the header row is skipped.
with open('sunspots.csv') as csvfile:
    reader = csv.reader(csvfile, delimiter=',')
    next(reader)
    for row in reader:
        sunspots.append(float(row[2]))   # YOUR CODE HERE
        time_step.append(int(row[0]))  # YOUR CODE HERE

series = np.array(sunspots)  # YOUR CODE HERE

# DO NOT CHANGE THIS CODE
# This is the normalization function
# NOTE: at module level these two assignments rebind the built-in names
# `min` and `max` for the rest of the session.
min = np.min(series)
max = np.max(series)
series -= min
series /= max
time = np.array(time_step)
split_time = 3000
time_train = time[:split_time]  # YOUR CODE HERE
x_train = series[:split_time]  # YOUR CODE HERE
time_valid = time[split_time:]  # YOUR CODE HERE
x_valid = series[split_time:]  # YOUR CODE HERE

# DO NOT CHANGE THIS CODE
window_size = 30
batch_size = 32
shuffle_buffer_size = 1000
    
def model_forecast(model, series, window_size):
    """Run `model.predict` over every sliding window of `series`.

    `series` is cut into windows of `window_size` consecutive elements (shift
    of 1, incomplete trailing windows dropped); the windows are grouped into
    batches of 32 and fed to the model.

    Args:
        model: Object exposing a `predict` method that accepts a dataset.
        series: The values to window.
        window_size: Number of elements per window.

    Returns:
        Whatever `model.predict` returns for the batched windows.
    """
    windows = (
        tf.data.Dataset.from_tensor_slices(series)
        .window(window_size, shift=1, drop_remainder=True)
        # Each window is itself a dataset; batching it by its full length
        # collapses it into a single tensor.
        .flat_map(lambda win: win.batch(window_size))
    )
    batched = windows.batch(32).prefetch(1)
    return model.predict(batched)

# window_size = 30  # YOUR CODE HERE (already assigned above, so left commented out)
# Forecast over the whole normalized series; np.newaxis adds the trailing
# axis before the series is windowed.
rnn_forecast = model_forecast(model, series[..., np.newaxis], window_size)
# Keep the windows starting at index split_time - window_size, drop the final
# window, and take the last time step (-1) of output channel 0 from each.
# NOTE(review): presumably this lines each forecast up with one element of
# x_valid - confirm the two lengths match for the downloaded CSV.
rnn_forecast = rnn_forecast[split_time - window_size:-1, -1, 0]

# Mean absolute error between the validation values and the forecasts.
result = tf.keras.metrics.mean_absolute_error(x_valid, rnn_forecast).numpy()

# To get the maximum score, your model must have an MAE OF .12 or less.
# When you Submit and Test your model, the grading infrastructure
# converts the MAE of your model to a score from 0 to 5 as follows:

test_val = 100 * result
score = math.ceil(17 - test_val)
# Cap the score at 5. An explicit comparison is used here; note that the
# built-in `min` has been rebound to a NumPy scalar by the normalization code
# earlier in this cell, so `min(score, 5)` would not work.
if score > 5:
    score = 5

print(score)

5
