# Train NF

Import necessary libraries

In [None]:
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns

import tensorflow as tf
from tensorflow import keras

from sklearn.preprocessing import StandardScaler

import warnings
warnings.filterwarnings("ignore")

In [None]:
# Print the TensorFlow version so the environment used for this run is recorded in the output.
print(f"Versión de TensorFlow: {tf.__version__}")

Versión de TensorFlow: 2.15.0


Load data from Google Drive

In [None]:
# Colab-only step: mount Google Drive at /content/drive.
# NOTE(review): presumably `path` below points inside this mount — confirm.
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:
# Placeholder for the data location. File names are appended by plain string
# concatenation (e.g. path + 'X_train.npy'), so a directory path must end with
# a path separator.
path = "..."

In [None]:
# Training fields and their target parameters, read from .npy files under `path`.
X_train = np.load(path + 'X_train.npy')
y_train = np.load(path + 'y_train.npy') # target columns, in order: (alpha, theta, ratio)

We standardize the target variables (parameters) to zero mean and unit variance, so that all of them are on a comparable scale; this improves the performance of the neural network.

In [None]:
# Fit the scaler on the raw targets read straight from disk rather than on the
# in-memory `y_train`. This cell overwrites `y_train` with its standardized
# version, so fitting on that variable would make a second execution of the
# cell refit the scaler on already-standardized data (mean ~0, scale ~1) and
# silently break the later `y_scaler.inverse_transform` call on predictions.
y_scaler = StandardScaler()
y_train = y_scaler.fit_transform(np.load(path + 'y_train.npy'))

In [None]:
# Per-column means learned from the training targets.
y_scaler.mean_

array([1.49225652, 2.07506667, 0.49766667])

In [None]:
# Per-column scaling factors that the centred targets are divided by.
y_scaler.scale_

array([0.90576534, 1.15612128, 0.2267739 ])

Save ``y_scaler``

In [2]:
# joblib is used in the next cell to serialize the fitted scaler; its version is
# printed so the environment that produced the pickle is recorded.
import joblib
print(f'{joblib.__version__}')

1.4.2


In [None]:
# Persist the fitted scaler so the same transform (and its inverse) can be
# reused later without refitting.
joblib.dump(y_scaler, path + 'y_scaler.pkl')

Augment the data by rotating the fields by $180$ degrees; each rotated field keeps the same target parameters as its original.

In [None]:
def augment_data(x, y):
    """Double a batch by pairing every field with its 180-degree rotation.

    Each sample of ``x`` is followed immediately by a copy produced with
    ``np.rot90(sample, 2)``; the matching entry of ``y`` is repeated unchanged
    for both the original and the rotated copy.

    Args:
        x: Iterable of array-like fields.
        y: Iterable of targets aligned with ``x``.

    Returns:
        A ``(fields, targets)`` tuple of TensorFlow tensors, interleaved as
        original, rotated, original, rotated, ...
    """
    fields = []
    targets = []

    for field, target in zip(x, y):
        # Original first, then its 180-degree rotation; both share one target.
        fields.extend((field, np.rot90(field, 2)))
        targets.extend((target, target))

    return tf.convert_to_tensor(fields), tf.convert_to_tensor(targets)

class DataGenerator(keras.utils.Sequence):
    """Keras ``Sequence`` that serves rotation-augmented training batches.

    Every batch is built from up to ``batch_size`` original samples and then
    passed through ``augment_data``, so the tensors handed to Keras contain
    twice as many entries as were drawn from ``X``/``y``.

    Args:
        X: Indexable collection of input fields.
        y: Indexable collection of targets aligned with ``X``.
        batch_size: Number of original samples per batch (before augmentation).
        shuffle: If True, the sample order is shuffled at construction time
            and again at the end of every epoch.
    """

    def __init__(self, X, y, batch_size, shuffle=True):
        # Nothing to initialise in the base class on older Keras versions;
        # newer versions expect the base initialiser to be called.
        super().__init__()
        self.X = X
        self.y = y
        self.batch_size = batch_size
        self.shuffle = shuffle
        self.indexes = np.arange(len(self.X))
        if self.shuffle:
            np.random.shuffle(self.indexes)

    def __len__(self):
        """Return the number of batches per epoch (the last one may be partial)."""
        return int(np.ceil(len(self.X) / self.batch_size))

    def __getitem__(self, index):
        """Return the augmented ``(X, y)`` tensors for batch number ``index``."""
        indexes = self.indexes[index * self.batch_size:(index + 1) * self.batch_size]

        X_batch = [self.X[i] for i in indexes]
        y_batch = [self.y[i] for i in indexes]

        return augment_data(X_batch, y_batch)

    def on_epoch_end(self):
        """Reshuffle the sample order so each epoch sees different batches.

        Without this hook the order chosen in ``__init__`` would be reused for
        every epoch, which makes ``shuffle=True`` a one-off shuffle only.
        """
        if self.shuffle:
            np.random.shuffle(self.indexes)

In [None]:
# Seed Python, NumPy and TensorFlow in one call so that weight initialisation
# and the NumPy-based batch shuffling are repeatable across fresh runs of the
# notebook. (Some GPU kernels may still introduce small run-to-run differences.)
SEED = 42
keras.utils.set_random_seed(SEED)

# CNN regressor: a 16x16 single-channel field is reduced to a 1x1 feature map
# by three unpadded convolutions, then mapped to the three standardized targets.
model = keras.Sequential([
    # 16x16x1 -> 8x8x128
    keras.layers.Conv2D(filters=128, kernel_size=9, input_shape=(16,16,1), activation='relu'),
    # 8x8x128 -> 4x4x256
    keras.layers.Conv2D(filters=256, kernel_size=5, activation='relu'),
    # 4x4x256 -> 1x1x512
    keras.layers.Conv2D(filters=512, kernel_size=4, activation='relu'),
    # 1x1 convolution: per-position channel mixing, 1x1x512 -> 1x1x1024
    keras.layers.Conv2D(filters=1024, kernel_size=1, activation='relu'),
    keras.layers.Flatten(),
    keras.layers.Dense(300, activation='relu'),
    # Linear output layer: one unit per target parameter.
    keras.layers.Dense(3)
])
# Trained on mean absolute error; mean squared error is tracked as a metric only.
model.compile(optimizer=keras.optimizers.AdamW(),
              loss=keras.losses.MeanAbsoluteError(),
              metrics=[keras.metrics.MeanSquaredError()])
model.summary()

Model: "sequential_6"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_23 (Conv2D)          (None, 8, 8, 128)         10496     
                                                                 
 conv2d_24 (Conv2D)          (None, 4, 4, 256)         819456    
                                                                 
 conv2d_25 (Conv2D)          (None, 1, 1, 512)         2097664   
                                                                 
 conv2d_26 (Conv2D)          (None, 1, 1, 1024)        525312    
                                                                 
 flatten_6 (Flatten)         (None, 1024)              0         
                                                                 
 dense_16 (Dense)            (None, 300)               307500    
                                                                 
 dense_17 (Dense)            (None, 3)                

In [None]:
# Number of original samples drawn per step. augment_data adds one rotated copy
# per sample, so each training step sees up to 2 * batch_size fields.
batch_size = 500
generator = DataGenerator(X_train, y_train, batch_size)

In [None]:
%%time
# Train on the augmented batches from the generator; no validation data or
# callbacks are passed, so `history` only holds training loss and metric values.
history = model.fit(generator,
                    epochs = 50,
                    verbose = 1,
                    )

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50
CPU times: user 44min 3s, sys: 52.6 s, total: 44min 56s
Wall time: 39min 31s


In [None]:
X_test = np.load(path + 'X_test.npy')

# The network was trained on standardized targets, so its outputs are mapped
# back to the original parameter scale with the fitted scaler before display.
y_pred_test = y_scaler.inverse_transform(model.predict(X_test, verbose = 0))
y_pred_test

array([[ 2.975435  ,  1.0755346 ,  0.40735844],
       [ 2.991985  ,  1.1226343 ,  0.3593339 ],
       [-0.04057837,  1.0856812 ,  0.29411298],
       ...,
       [ 0.6562753 ,  3.1020145 ,  0.81865036],
       [ 0.6737718 ,  3.0899575 ,  0.7606943 ],
       [ 0.15253878,  2.8015354 ,  0.5997586 ]], dtype=float32)

In [None]:
# Store the de-standardized test predictions under the same `path` prefix as the input data.
np.save(path+'y_pred_NF.npy', y_pred_test)

Save trained NN

In [None]:
# Save the trained model as a single file in the native Keras (.keras) format.
model.save(path+'model.keras')