## 참고: https://hleecaster.com/ml-linear-regression-example/

## 라이브러리 설치, 호출

!pip3 install -U scikit-learn<br>
!pip3 install pandas<br>
!pip3 install numpy<br>
!pip3 install matplotlib<br>
!pip3 install statsmodels<br>

In [28]:
import tensorflow as tf
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import statsmodels.api as sm

from tensorflow.keras.models import Sequential, load_model
from tensorflow.keras.layers import Input, Dense, Concatenate, InputLayer
from tensorflow.keras.optimizers import SGD, Adam

from tensorflow.keras.callbacks import ModelCheckpoint, TensorBoard, ReduceLROnPlateau

from tensorflow.keras.models import Model

## 데이터 다운로드 (특별할인 판매)

In [29]:
import pandas as pd
TRAIN = pd.read_csv('LungCancer/train.csv')
VALID = pd.read_csv('LungCancer/valid.csv')

In [30]:
TRAIN.head()

Unnamed: 0,Relapse,CEA_Post,Lymphatic,Vascular,pStage,pT,pN,Perineural,Age
0,0,0.0,0,0,4,2,2,0,73
1,0,1.2,1,0,4,2,2,1,73
2,1,1.8,1,0,4,1,2,0,53
3,0,0.0,1,0,4,2,2,0,57
4,1,52.0,1,1,6,4,3,0,65


# Input, Feature 설정

In [31]:
TRAIN_y = TRAIN[['Relapse']]
TRAIN_x = TRAIN[ TRAIN.columns[1:] ]

VALID_y = VALID[['Relapse']]
VALID_x = VALID[ VALID.columns[1:] ]

In [32]:
TRAIN_x1 = TRAIN_x.iloc[:, :4]
TRAIN_x2 = TRAIN_x.iloc[:, 4:8]

In [33]:
VALID_x1 = VALID_x.iloc[:, :4]
VALID_x2 = VALID_x.iloc[:, 4:8]

## Keras, Multiple-input Logit 모델 architecture

In [34]:
InputA = Input(shape=(TRAIN_x1.shape[1],), dtype='int32', name='inputA')
x = Dense(10, activation='relu')(InputA)
OutputA = Dense(4, activation='relu')(x)

In [35]:
InputB = Input(shape=(TRAIN_x2.shape[1],), dtype='int32', name='inputB')
x = Dense(10, activation='relu')(InputB)
OutputB = Dense(4, activation='relu')(x)

In [36]:
Merged = Concatenate(axis=1)([OutputA, OutputB])
Output = Dense(1, activation='sigmoid')(Merged)

In [37]:
Model = tf.keras.models.Model(inputs=[InputA, InputB], outputs=Output)

In [38]:
Model.summary()

Model: "model_4"
__________________________________________________________________________________________________
 Layer (type)                   Output Shape         Param #     Connected to                     
 inputA (InputLayer)            [(None, 4)]          0           []                               
                                                                                                  
 inputB (InputLayer)            [(None, 4)]          0           []                               
                                                                                                  
 dense_10 (Dense)               (None, 10)           50          ['inputA[0][0]']                 
                                                                                                  
 dense_12 (Dense)               (None, 10)           50          ['inputB[0][0]']                 
                                                                                            

In [39]:
Model.compile(loss='binary_crossentropy',optimizer=Adam(learning_rate=0.001))

In [40]:
Model.fit(x=[TRAIN_x1, TRAIN_x2], y=TRAIN_y, epochs=300, shuffle=True)

Epoch 1/300

2022-07-13 11:15:59.520371: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:113] Plugin optimizer for device_type GPU is enabled.


Epoch 2/300
Epoch 3/300
Epoch 4/300
Epoch 5/300
Epoch 6/300
Epoch 7/300
Epoch 8/300
Epoch 9/300
Epoch 10/300
Epoch 11/300
Epoch 12/300
Epoch 13/300
Epoch 14/300
Epoch 15/300
Epoch 16/300
Epoch 17/300
Epoch 18/300
Epoch 19/300
Epoch 20/300
Epoch 21/300
Epoch 22/300
Epoch 23/300
Epoch 24/300
Epoch 25/300
Epoch 26/300
Epoch 27/300
Epoch 28/300
Epoch 29/300
Epoch 30/300
Epoch 31/300
Epoch 32/300
Epoch 33/300
Epoch 34/300
Epoch 35/300
Epoch 36/300
Epoch 37/300
Epoch 38/300
Epoch 39/300
Epoch 40/300
 1/13 [=>............................] - ETA: 0s - loss: 0.8471

KeyboardInterrupt: 

In [None]:
!pip install pydot

In [27]:
tf.keras.utils.plot_model(model=Model, show_shapes=True)

You must install pydot (`pip install pydot`) and install graphviz (see instructions at https://graphviz.gitlab.io/download/) for plot_model/model_to_dot to work.


In [48]:
# Call-back 함수
# CheckPoint: Epoch 마다 validation 성능을 검증하여, best performance 일 경우 저장
CP = ModelCheckpoint(filepath='{epoch:03d}-{loss:.4f}-{val_loss:.4f}.hdf5',
            monitor='val_loss', verbose=1, save_best_only=True, mode='min')
#minitor -> loss -> val_loss

# Learning Rate 줄여나가기
LR = ReduceLROnPlateau(monitor='val_loss', factor=0.6, patience=4,
                       verbose=1, min_lr=1e-8)
# factor: Learning rate에 곱할 것.
#0.1 -> 0.08 -> 0.064 ....
#monitor='loss' -> monitor='val_loss'

CALLBACK = [CP, LR]

In [49]:
Model.fit(x=[TRAIN_x1, TRAIN_x2], y=TRAIN_y, epochs=5, shuffle=True,
          batch_size=32, callbacks=CALLBACK, validation_data = ([VALID_x1, VALID_x2], VALID_y))

Epoch 1/5
 1/13 [=>............................] - ETA: 0s - loss: 0.8994
Epoch 1: val_loss improved from inf to 1.00253, saving model to 001-1.0442-1.0025.hdf5
Epoch 2/5
 1/13 [=>............................] - ETA: 0s - loss: 0.9527
Epoch 2: val_loss improved from 1.00253 to 0.99973, saving model to 002-1.0398-0.9997.hdf5
Epoch 3/5
 1/13 [=>............................] - ETA: 0s - loss: 1.1481
Epoch 3: val_loss improved from 0.99973 to 0.99652, saving model to 003-1.0347-0.9965.hdf5
Epoch 4/5
 1/13 [=>............................] - ETA: 0s - loss: 0.9468
Epoch 4: val_loss improved from 0.99652 to 0.99268, saving model to 004-1.0304-0.9927.hdf5
Epoch 5/5
 1/13 [=>............................] - ETA: 0s - loss: 0.7411
Epoch 5: val_loss improved from 0.99268 to 0.99069, saving model to 005-1.0254-0.9907.hdf5


<keras.callbacks.History at 0x1cd582d1f30>