In [9]:
from lib.config import Config_f
from lib.data_set import Features
from lib.model import SimpleModel
from lib import utils

In [15]:
import imp
imp.reload(utils)

<module 'utils' from 'E:\\Document\\jupyter\\Master Thesis\\utils.py'>

In [3]:
import ctypes
import pandas as pd
import numpy as np
import pywt
import time
import matplotlib.pyplot as plt

from sklearn.preprocessing import OneHotEncoder, StandardScaler, MinMaxScaler
from sklearn.feature_selection import SelectKBest,f_classif,chi2,mutual_info_classif,VarianceThreshold,RFE,SelectFromModel
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.decomposition import PCA
from sklearn.metrics import confusion_matrix,accuracy_score

from tensorflow.keras import layers as KL
from tensorflow.keras import models as KM
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow import keras
import tensorflow as tf

## File name read

In [4]:
# read file name of data with various Labels
df = pd.read_csv('./useful_data_label.csv',index_col=0) 
# read file name of data with only label 0
df2 = pd.read_csv('./unuseful_data_label.csv',index_col=0)
# read some of the data with only label 0
df3 = pd.read_csv('./data/file_name.txt',header=None)
player = ctypes.windll.kernel32

ind = df2.iloc[1].isna()
files = np.concatenate([np.array(df.columns),np.array('normal/'+df2.columns[ind])])

## Configuration

In [5]:
# Override the base class of Config and Features for ANN Model
class ANN_Config(Config_f):
    NAME = 'ANN'
    NUM_CLASSES = 2
    EPOCHS = 300
    BATCH_SIZE = 32
    CLASS_WEIGHTS = None
    COST_SENSITIVE = False
    
    FN_LP = 300
    DETREND_LAMBDA = 50
    TEST_FILES = files[[6,30,31,32,33,34,35]]
    
    
class ANN_dataset(Features):
    
    def __init__(self,config):
        super(ANN_dataset,self).__init__(config)
        self.config = config
        

In [6]:
# Generate ANN configuration
config = ANN_Config()
config.display()


Configurations:
BATCH_SIZE                     32
BINS                           3
CHANNELS                       ['LEFT_TA', 'LEFT_TS', 'LEFT_BF', 'LEFT_RF', 'RIGHT_TA', 'RIGHT_TS', 'RIGHT_BF', 'RIGHT_RF']
CLASS_WEIGHTS                  None
COST_SENSITIVE                 False
DETREND_LAMBDA                 50
EPOCHS                         300
FEATURES_LIST                  ['IEMG', 'SSI', 'WL', 'ZC', 'ku', 'SSC', 'skew', 'Acti', 'AR', 'HIST', 'MDF', 'MNF', 'mDWT']
FN_LP                          300
LEVEL_DWT                      3
NAME                           ANN
NUM_CLASSES                    2
NUM_MF                         3
N_ENV                          20
RANGES                         (-3, 3)
RECT                           False
SAME_LABEL                     True
SCALE                          True
SHUFFLE                        True
STEP_SIZE                      512
TEST_FILES                     ['G08_FoG_1_trial_1_emg.csv' 'normal/G09_Walking_trial_2_emg.csv'
 'norma

## Data generate

In [7]:
data = ANN_dataset(config)

In [8]:
# Choose features to use
data.feature_list = ['IEMG', 'SSI', 'WL', 'ZC', 'ku', 'SSC', 'skew', 'Acti', 'AR', 'HIST', 'MF','MDF', 'MNF', 'mDWT']
data.num_mf = 10

# Load data from files
data.load_data(files)

# Extract features from data
data.extract_features()

X_train,Y_train,_ = data.train_set
X_valid,Y_valid,_ = data.valid_set
X_test, Y_test, _ = data.test_set

skip
skip


NameError: name 'utils' is not defined

## Model

In [11]:
# Override base class of SimpleMode for ANN
class ANN_Model(SimpleModel):
    
    def build(self,config):
        
        reg = keras.regularizers.l1(0)
        acti = 'relu'
        drop = 0.2
        init = 'glorot_normal'

        model = KM.Sequential()
        #model.add(layers.BatchNormalization())
        model.add(KL.Dense(128,
                               kernel_initializer=init,
                               kernel_regularizer = reg,
                               #use_bias=False
                         ))
        # model.add(layers.BatchNormalization())
        model.add(KL.Activation(acti))
        # model.add(layers.LeakyReLU(0.3))
        model.add(KL.Dropout(drop))

        model.add(KL.Dense(64,
                               kernel_initializer=init,
                               kernel_regularizer = reg,
                              # use_bias=False
                         ))
        # model.add(layers.BatchNormalization())
        model.add(KL.Activation(acti))
        # model.add(layers.LeakyReLU(0.1))
        model.add(KL.Dropout(drop))

        model.add(KL.Dense(32,
                               kernel_initializer=init,
                               kernel_regularizer = reg,
                               #use_bias=False
                         ))
        # model.add(layers.BatchNormalization())
        model.add(KL.Activation(acti))
        # model.add(layers.LeakyReLU(0.1))
        model.add(KL.Dropout(drop))

        model.add(KL.Dense(16,
                               kernel_initializer=init,
                               kernel_regularizer = reg,
                               #use_bias=False
                         ))
        # model.add(layers.BatchNormalization())
        model.add(KL.Activation(acti))
        # model.add(layers.LeakyReLU(0.1))
        model.add(KL.Dropout(drop))

        model.add(KL.Dense(config.NUM_CLASSES,activation='softmax'))

        
        if config.COST_SENSITIVE:
            self.cost_matrix = config.COST_MATRIX
            model.compile(loss=self.sparse_cost_sensitive_loss, optimizer="adam", metrics=['accuracy'])
            print('Using cost sensitive with cost matrix:\n',np.array(self.cost_matrix))
        else:
            model.compile(loss='categorical_crossentropy', optimizer="adam", metrics=['accuracy'])
            if config.CLASS_WEIGHTS != None:
                print('Using categorical crossentropy with class weights:\n',config.CLASS_WEIGHTS)
            else:
                print('Using categorical crossentropy without class weights.')
        
        return model
    
    def train(self, train_dataset, val_dataset, transformer=None, callbacks=None):
        
        self.X_train = train_dataset[0]
        scaler = MinMaxScaler()
        X_train = scaler.fit_transform(train_dataset[0])
        
        scaler.fit(np.concatenate([train_dataset[0],val_dataset[0]]))
        X_val = scaler.transform(val_dataset[0])
        
        if transformer != None:
            self.transformer = transformer
            self.transformer.fit(X_train,train_dataset[1])
            X_train = self.transformer.transform(X_train)
            X_val = self.transformer.transform(X_val)
        else:
            self.transformer = None

        self.simple_model.fit(X_train,
                              train_dataset[1],
                              validation_data=(X_val,val_dataset[1]),
                              epochs=self.config.EPOCHS,
                              batch_size=self.config.BATCH_SIZE,
                              class_weight=self.config.CLASS_WEIGHTS,
                              callbacks=callbacks,
                              shuffle=True)

    def sparse_cost_sensitive_loss (self,y_true,y_pred):
        cost_matrix = self.cost_matrix
        batch_cost_matrix = tf.nn.embedding_lookup(cost_matrix, tf.argmax(y_true,axis=1))
        eps = 1e-6
        probability = tf.clip_by_value(y_pred, eps, 1-eps)
        cost_values = tf.math.log(1-probability)*batch_cost_matrix
        loss = tf.reduce_mean(-tf.reduce_sum(cost_values, axis=1))
        return loss
    
    def model_metrics(self,data,label):
        pred = self.predict(data)
        acc = accuracy_score(np.argmax(label,axis=1),np.argmax(pred,axis=1))
        cm = confusion_matrix(np.argmax(label,axis=1),np.argmax(pred,axis=1))
        return acc,cm

## Data split

In [22]:
# data split and processing for model
class_id = [2,6]
binary = True
x_train,y_train,x_valid,y_valid,x_test,y_test = utils.data_split_oh((X_train,X_valid,X_test),
                                                                    (Y_train,Y_valid,Y_test),
                                                                    class_id,
                                                                    binary,
                                                                    random_state = 555)

## Model training

In [30]:
config.EPOCHS = 300
config.NUM_CLASSES = 2
config.CLASS_WEIGHTS = None#{0:1,1:5}

config.COST_MATRIX = tf.constant([[0,1.],
              [10,0]])

if binary:
    config.COST_SENSITIVE = True
    config.NUM_CLASSES = 2
else:
    config.COST_SENSITIVE = False
    config.NUM_CLASSES = len(class_id)

# Generate ANN Model
ANN_model = ANN_Model('ANN',config,'./model/ANN/')

Using categorical crossentropy without class weights.


In [31]:
pca = PCA(n_components=150,copy=True)
sfm = SelectFromModel(GradientBoostingClassifier(),max_features=80)
rfe = RFE(estimator=LogisticRegression(max_iter=10000), n_features_to_select=100)
vt = VarianceThreshold(threshold=0.01)

early_stopping = keras.callbacks.EarlyStopping(patience = 10,
                                             monitor = 'val_loss', 
                                             #baseline = 0.9,
                                             restore_best_weights=True)

ANN_model.train((x_train,y_train),
                (x_valid,y_valid),
                pca,
                [early_stopping])

Epoch 1/300
Epoch 2/300
Epoch 3/300
Epoch 4/300
Epoch 5/300
Epoch 6/300
Epoch 7/300
Epoch 8/300
Epoch 9/300
Epoch 10/300
Epoch 11/300
Epoch 12/300
Epoch 13/300
Epoch 14/300
Epoch 15/300
Epoch 16/300
Epoch 17/300
Epoch 18/300
Epoch 19/300
Epoch 20/300
Epoch 21/300
Epoch 22/300
Epoch 23/300
Epoch 24/300
Epoch 25/300
Epoch 26/300
Epoch 27/300


## Model evaluation

In [32]:
acc_train,cm_train = ANN_model.model_metrics(x_train,y_train)
acc_valid,cm_valid = ANN_model.model_metrics(x_valid,y_valid)
acc_test,cm_test = ANN_model.model_metrics(x_test,y_test)
print('acc_train: %f\nconfusion_matrix:\n'%acc_train,cm_train,'\n')
print('acc_valid: %f\nconfusion_matrix:\n'%acc_valid,cm_valid,'\n')
print('acc_test: %f\nconfusion_matrix:\n'%acc_test,cm_test)

acc_train: 1.000000
confusion_matrix:
 [[259   0]
 [  0 161]] 

acc_valid: 0.964539
confusion_matrix:
 [[93  3]
 [ 2 43]] 

acc_test: 0.926174
confusion_matrix:
 [[55  2]
 [ 9 83]]
