# \Sigma_{a1} в зависимости от плотности теплоносителя, температуры теплоносителя, температуры топлива и концентрации борной кислоты

## 1. Загрузка данных

In [1]:
import pandas as pd

Загрузка данных

In [2]:
df = pd.read_excel('Input/Data.xlsx')
df.head(3)

Unnamed: 0,\rho(g/cm^3),T_c(K),T_f(K),c_b(ppm),3S_{tr1}(1),3S_{tr2}(2),\Sigma_{a1}(3),\Sigma_{a2}(4),nuS_{f1}(5),nuS_{f2}(6),\Sigma_{f1}(7),\Sigma_{f2}(8),\Sigma_{1->2}(9),k_{inf}(10),\sigma_{a2}^{Xe},\sigma_{a2}^{Sm}
0,0.7235,575.0,1027.0,600.0,0.661853,2.568298,0.009376,0.085584,0.006677,0.13325,0.00262,0.05475,0.017392,1.261041,1072970.0,35421.398
1,0.775,448.0,1043.0,1500.0,0.679602,2.874687,0.009581,0.098339,0.006723,0.139256,0.002636,0.057218,0.018726,1.174265,1141000.0,36147.801
2,0.9125,370.5,1418.0,750.0,0.727336,3.668742,0.009908,0.102815,0.006844,0.153823,0.002681,0.063203,0.022463,1.249619,1308480.0,39214.0


In [3]:
names = ['\\rho(g/cm^3)',
 'T_c(K)',
 'T_f(K)',
 'c_b(ppm)',
 '\Sigma_{a1}(3)']

In [4]:
df = df[names]
df.head(3)

Unnamed: 0,\rho(g/cm^3),T_c(K),T_f(K),c_b(ppm),\Sigma_{a1}(3)
0,0.7235,575.0,1027.0,600.0,0.009376
1,0.775,448.0,1043.0,1500.0,0.009581
2,0.9125,370.5,1418.0,750.0,0.009908


### 2 Нормализация признаков

In [5]:
features = ['\\rho(g/cm^3)',
 'T_c(K)',
 'T_f(K)',
 'c_b(ppm)']

In [6]:
df_features_norm = df.copy()

In [7]:
for i in range(len(features)):
    df_features_norm[features[i]] = (df[features[i]]-df[features[i]].mean())/df[features[i]].std()

In [8]:
df_features_norm

Unnamed: 0,\rho(g/cm^3),T_c(K),T_f(K),c_b(ppm),\Sigma_{a1}(3)
0,-0.316426,1.416398,-0.039094,-1.035019,0.009376
1,0.007922,-0.005506,-0.001946,0.006984,0.009581
2,0.873902,-0.873204,0.868693,-0.861352,0.009908
3,-0.858058,0.862191,-0.872586,0.875321,0.009156
4,-0.425067,-0.439355,0.433373,-1.295520,0.009418
...,...,...,...,...,...
252,-0.844527,-0.886762,-1.539169,-0.603564,0.008832
253,0.887433,0.848634,0.202111,1.133108,0.010004
254,0.021453,-0.019064,1.072750,-1.471900,0.009660
255,-1.710507,1.716332,-0.668529,0.264771,0.008792


In [9]:
df_features_norm.sample(frac=1) 

Unnamed: 0,\rho(g/cm^3),T_c(K),T_f(K),c_b(ppm),\Sigma_{a1}(3)
194,0.941557,-0.181757,-0.069965,-0.006584,0.009817
58,1.361016,-1.144360,1.140769,-1.566875,0.009975
200,-1.006898,-0.398682,1.453653,0.210500,0.009514
37,1.469262,0.482574,0.814277,-1.024165,0.010004
7,-1.291047,0.428343,1.304013,1.309489,0.009435
...,...,...,...,...,...
184,-1.196331,-0.968109,1.263202,0.834618,0.009442
151,-0.925712,0.170745,1.535275,-0.087989,0.009539
149,1.672228,1.038443,-1.076642,-0.956326,0.009562
209,0.400320,1.011327,1.344824,1.187379,0.010099


In [10]:
from sklearn.model_selection import train_test_split

X_train, X_test, y_train, y_test = train_test_split(df_features_norm[['\\rho(g/cm^3)', 'T_c(K)', 'T_f(K)', 'c_b(ppm)']],
                                                    df_features_norm[['\\Sigma_{a1}(3)']],
                                                    test_size=0.33,
                                                    random_state=42)

# Нейросетевые модели

In [11]:
%%time

# Use scikit-learn to grid search the batch size and epochs
import numpy
from sklearn.model_selection import GridSearchCV
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasRegressor
import tensorflow as tf

# Function to create model, required for KerasRegressor
def create_model(activation='relu', learn_rate=0.01, momentum=0):
    # create model
    model = Sequential()
    model.add(Dense(4, input_dim=4, activation=activation))
    model.add(Dense(1, kernel_initializer='normal'))
    
    optimizer = tf.keras.optimizers.RMSprop(learning_rate = learn_rate, rho = 0.99, momentum = momentum, epsilon=1e-09)
    
    # Compile model
    model.compile(loss='mse', optimizer=optimizer)
    return model

X = X_train
Y = y_train

# create model
model = KerasRegressor(build_fn=create_model, verbose=0)

# define the grid search parameters
batch_size = [10, 15, 20]
epochs = [1000, 1200, 1300]
activation = ['tanh', 'sigmoid', 'linear']
learn_rate = [0.00015, 0.0002, 0.00025]
momentum = [0, 0.00001]

param_grid = dict(batch_size=batch_size,
                  epochs=epochs,
                  activation=activation,
                  learn_rate=learn_rate,
                  momentum=momentum
                 )
grid = GridSearchCV(estimator=model, param_grid=param_grid, n_jobs=5)
grid_result = grid.fit(X, Y)

# summarize results
print("Best: %f using %s" % (grid_result.best_score_, grid_result.best_params_))
means = grid_result.cv_results_['mean_test_score']
stds = grid_result.cv_results_['std_test_score']
params = grid_result.cv_results_['params']
for mean, stdev, param in zip(means, stds, params):
    print("%f (%f) with: %r" % (mean, stdev, param))

Best: -0.000000 using {'activation': 'linear', 'batch_size': 10, 'epochs': 1200, 'learn_rate': 0.00015, 'momentum': 0}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.00015, 'momentum': 0}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.00015, 'momentum': 1e-05}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.0002, 'momentum': 0}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.0002, 'momentum': 1e-05}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.00025, 'momentum': 0}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1000, 'learn_rate': 0.00025, 'momentum': 1e-05}
-0.000000 (0.000000) with: {'activation': 'tanh', 'batch_size': 10, 'epochs': 1200, 'learn_rate': 0.00015, 'momentum': 0}
-0.000000 (0.0000

In [12]:
stop

NameError: name 'stop' is not defined

## Модель 1

In [13]:
def create_model():

    # create model
    model = Sequential()
    model.add(Dense(4, input_dim=4, activation='linear'))
    model.add(Dense(1, kernel_initializer='normal'))

    optimizer = tf.keras.optimizers.RMSprop(learning_rate = 0.00015, rho = 0.99, momentum = 0, epsilon=1e-09)
    
    # Compile model
    model.compile(loss='mse', optimizer=optimizer)
    return model

In [14]:
model = create_model()
model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_2 (Dense)              (None, 4)                 20        
_________________________________________________________________
dense_3 (Dense)              (None, 1)                 5         
Total params: 25
Trainable params: 25
Non-trainable params: 0
_________________________________________________________________


In [15]:
# Обучение модели

EPOCHS = 1200
batch_size = 10

history = model.fit(
  X, Y,
  epochs=EPOCHS, batch_size = batch_size,verbose=0)

In [16]:
hist = pd.DataFrame(history.history)
hist['epoch'] = history.epoch
hist.tail(10)

Unnamed: 0,loss,epoch
1190,8.743196e-09,1190
1191,2.892491e-08,1191
1192,8.711312e-08,1192
1193,2.408945e-07,1193
1194,1.564733e-08,1194
1195,3.288625e-08,1195
1196,2.849991e-07,1196
1197,7.408162e-09,1197
1198,7.885307e-08,1198
1199,4.699406e-08,1199


In [17]:
import statsmodels as statsmodels
import statsmodels.api as sm

RMSPE = statsmodels.tools.eval_measures.rmspe(y_test.values, model.predict(X_test))
RMSPE

array([0.08770652])

In [18]:
import statsmodels as statsmodels
import statsmodels.api as sm

RMSPE = statsmodels.tools.eval_measures.rmspe(y_train.values, model.predict(X_train))
RMSPE

array([0.06793273])