In [1]:
########################################################################
# import python-library
########################################################################
import pickle
import os
import sys
import glob

import numpy as np
import librosa
import librosa.core
import librosa.feature
import yaml
import logging
import keras

from tqdm import tqdm
from sklearn import metrics
from keras.models import Model
from keras.layers import Input, Dense

from itertools import combinations
########################################################################



########################################################################
# setup STD I/O
########################################################################
# Configure and initialise logging.
# basicConfig attaches a file handler for "make_pretrain_v3.log" to the root
# logger at DEBUG level; the logger named ' ' additionally gets a stream
# handler that prefixes each record with a timestamp and the level name.
logging.basicConfig(level=logging.DEBUG, filename="make_pretrain_v3.log")
logger = logging.getLogger(' ')
handler = logging.StreamHandler()  # no stream given: StreamHandler writes to sys.stderr
formatter = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
handler.setFormatter(formatter)
logger.addHandler(handler)
########################################################################



########################################################################
# file I/O
########################################################################
# File input/output helper functions
def save_pickle(filename, save_data):
    """Pickle ``save_data`` into the file at ``filename``.

    The destination path is logged at INFO level before the file is opened
    for binary writing.
    """
    log_line = "save_pickle -> {}".format(filename)
    logger.info(log_line)
    with open(filename, mode='wb') as sink:
        pickle.dump(save_data, sink)

def load_pickle(filename):
    """Return the object unpickled from the file at ``filename``.

    The source path is logged at INFO level before the file is opened for
    binary reading.
    """
    log_line = "load_pickle <- {}".format(filename)
    logger.info(log_line)
    # NOTE: unpickling can execute arbitrary code; only load files that this
    # pipeline wrote itself.
    with open(filename, mode='rb') as source:
        return pickle.load(source)


def file_load(wav_name, mono=False):
    """Load an audio file with librosa, keeping its native sampling rate.

    Parameters
    ----------
    wav_name : path of the audio file to read.
    mono : forwarded to ``librosa.load``; the default ``False`` asks librosa
        not to down-mix the channels.

    Returns
    -------
    The value returned by ``librosa.load(wav_name, sr=None, mono=mono)``
    (the audio data followed by the sampling rate), or ``None`` when loading
    raised an exception. Callers must check for ``None``.
    """
    try:
        return librosa.load(wav_name, sr=None, mono=mono)
    except Exception:
        # This used to be a bare ``except:``, which also swallowed
        # KeyboardInterrupt/SystemExit. logger.exception keeps the same
        # ERROR-level message but appends the traceback, so the real cause
        # (missing file, decode error, ...) is visible in the log.
        logger.exception("file_broken or not exists!! : {}".format(wav_name))
        return None


def demux_wav(wav_name, channel=0):
    """Load an audio file and return a single channel of it.

    Parameters
    ----------
    wav_name : path of the audio file to read (passed to ``file_load``).
    channel : index of the channel to extract when the loaded data has more
        than one dimension.

    Returns
    -------
    ``(sr, data)`` where ``sr`` is the sampling rate reported by the loader
    and ``data`` is the selected channel (or the loaded array unchanged when
    it has at most one dimension). Returns ``None`` when the file could not
    be loaded or the loader result could not be unpacked.
    """
    loaded = file_load(wav_name)
    if loaded is None:
        # file_load signals failure with None. Unpacking None raises
        # TypeError, which the ValueError handler below would not catch, so
        # the failure has to be handled explicitly here.
        logger.warning("demux_wav: no audio data loaded from {}".format(wav_name))
        return None
    try:
        multi_channel_data, sr = loaded
        if multi_channel_data.ndim <= 1:
            return sr, multi_channel_data
        return sr, np.array(multi_channel_data)[channel, :]
    except ValueError as msg:
        logger.warning(f'{msg}')
        return None
########################################################################





########################################################################
# feature extractor
########################################################################
def file_to_vector_array(file_name, n_mels=64, frames=5, n_fft=1024, hop_length=512, power=2.0):
    """Convert one audio file into stacked log-mel feature vectors.

    The file is loaded through ``demux_wav``, converted to a mel spectrogram
    and log-scaled. Every run of ``frames`` consecutive spectrogram columns
    is then concatenated into one row, producing the model input layout.

    Parameters
    ----------
    file_name : path of the audio file.
    n_mels, n_fft, hop_length, power : forwarded to
        ``librosa.feature.melspectrogram``.
    frames : number of consecutive spectrogram columns joined per row.

    Returns
    -------
    2-D float array of shape ``(n_columns - frames + 1, n_mels * frames)``;
    an empty ``(0, n_mels * frames)`` array when the spectrogram has fewer
    than ``frames`` columns.

    Raises
    ------
    RuntimeError
        When ``demux_wav`` returns ``None`` (the file could not be loaded).
    """
    dims = n_mels * frames
    demuxed = demux_wav(file_name)
    if demuxed is None:
        # Fail with a message naming the file instead of the opaque
        # "cannot unpack non-iterable NoneType object" the unpack would give.
        raise RuntimeError("could not load audio data from {}".format(file_name))
    sr, y = demuxed
    mel_spectrogram = librosa.feature.melspectrogram(y=y, sr=sr, n_fft=n_fft, hop_length=hop_length, n_mels=n_mels, power=power)
    # Adding machine epsilon keeps log10 finite for bins that are exactly zero.
    log_mel_spectrogram = 20.0 / power * np.log10(mel_spectrogram + sys.float_info.epsilon)
    vectorarray_size = log_mel_spectrogram.shape[1] - frames + 1
    if vectorarray_size < 1:
        return np.empty((0, dims), float)
    vectorarray = np.zeros((vectorarray_size, dims), float)
    # Slot t of every row holds the spectrogram column that is t steps after
    # the row's first column.
    for t in range(frames):
        vectorarray[:, n_mels * t: n_mels * (t + 1)] = log_mel_spectrogram[:, t: t + vectorarray_size].T
    return vectorarray

def list_to_vector_array(file_list, msg="calc...", n_mels=64, frames=5, n_fft=1024, hop_length=512, power=2.0):
    """Merge the feature vectors of several audio files into one dataset.

    Each file is converted with ``file_to_vector_array`` and its rows are
    appended, in ``file_list`` order, to a single 2-D array.

    Parameters
    ----------
    file_list : sequence of audio file paths.
    msg : description shown on the tqdm progress bar.
    n_mels, frames, n_fft, hop_length, power : forwarded to
        ``file_to_vector_array``.

    Returns
    -------
    2-D float array with ``n_mels * frames`` columns containing the rows of
    all files back to back.

    Raises
    ------
    ValueError
        When ``file_list`` is empty (previously an ``UnboundLocalError``).
    """
    dims = n_mels * frames
    n_files = len(file_list)
    if n_files == 0:
        raise ValueError("file_list is empty: no audio files to convert")

    dataset = None
    n_rows = 0  # number of dataset rows filled so far
    for idx, file_name in enumerate(tqdm(file_list, desc=msg)):
        vector_array = file_to_vector_array(file_name, n_mels=n_mels, frames=frames, n_fft=n_fft, hop_length=hop_length, power=power)
        n_new = vector_array.shape[0]
        if dataset is None:
            # Pre-allocate assuming every file yields as many rows as the
            # first one; this avoids holding two copies of a large dataset.
            dataset = np.zeros((n_new * n_files, dims), float)
        if n_rows + n_new > dataset.shape[0]:
            # The estimate was too small (files differ in length): grow the
            # buffer instead of writing at a wrong offset or failing.
            remaining = n_files - idx  # files still to store, this one included
            capacity = max(n_rows + n_new * remaining, 2 * dataset.shape[0])
            grown = np.zeros((capacity, dims), float)
            grown[:n_rows] = dataset[:n_rows]
            dataset = grown
        # Write at the running offset, not at ``n_new * idx``, so rows stay
        # contiguous even when files produce different row counts.
        dataset[n_rows:n_rows + n_new, :] = vector_array
        n_rows += n_new
    # Drop unused pre-allocated rows so no all-zero padding reaches training.
    return dataset if n_rows == dataset.shape[0] else dataset[:n_rows]


def dataset_generator(target_dir, machine_type, normal_dir_name="normal", ext="wav",
                      id_list=("id_00", "id_02", "id_04", "id_06"), snr="-6dB"):
    """Collect the normal-condition audio files of one machine type.

    Files are searched in
    ``<target_dir>/<snr>_<machine_type>/<machine_type>/<id>/<normal_dir_name>/*.<ext>``
    for every ``<id>`` in ``id_list``.

    Parameters
    ----------
    target_dir : root directory of the data.
    machine_type : machine name used in the two directory levels below the root.
    normal_dir_name : name of the sub-directory holding the files to collect.
    ext : file extension to match, without the dot.
    id_list : machine ID directory names to scan; the default matches the
        previously hard-coded list.
    snr : prefix of the top-level data directory; the default matches the
        previously hard-coded ``"-6dB"``.

    Returns
    -------
    List of file paths, sorted within each ID and concatenated in
    ``id_list`` order.
    """
    logger.info("target_dir : {}".format(target_dir))
    machine_type_path = os.path.join(target_dir, f"{snr}_{machine_type}", f"{machine_type}")
    train_files = []
    for id_ in id_list:
        normal_dir = os.path.join(machine_type_path, f"{id_}", normal_dir_name)
        normal_files = sorted(glob.glob(os.path.join(normal_dir, f"*.{ext}")))
        if not normal_files:
            # A missing or empty ID folder would otherwise go unnoticed.
            logger.warning("no *.{} files found in {}".format(ext, normal_dir))
        train_files.extend(normal_files)
    logger.info("train_file num : {num}".format(num=len(train_files)))
    return train_files
########################################################################




########################################################################
# keras model
########################################################################
def keras_model(inputDim):
    """Build the dense autoencoder.

    Layer widths are inputDim -> 64 -> 64 -> 8 -> 64 -> 64 -> inputDim.
    The five hidden layers use ReLU; the output layer has no activation.
    The returned Keras ``Model`` is not compiled.
    """
    inputLayer = Input(shape=(inputDim,))
    hidden = inputLayer
    for units in (64, 64, 8, 64, 64):
        hidden = Dense(units, activation="relu")(hidden)
    reconstruction = Dense(inputDim, activation=None)(hidden)
    return Model(inputs=inputLayer, outputs=reconstruction)
########################################################################




########################################################################
# main
########################################################################
# Main entry point: for every pair of machine types, build (or load from the
# pickle cache) the combined training set and train one autoencoder on it.
if __name__ == "__main__":
    with open("make_pretrain_v3.yaml", encoding='utf-8') as stream:
        pretrain_v3_param = yaml.safe_load(stream)

    os.makedirs(pretrain_v3_param["pickle_directory"], exist_ok=True)
    os.makedirs(pretrain_v3_param["model_directory"], exist_ok=True)
    pretrain_v3_data_dir = pretrain_v3_param["base_directory"]
    # Look the nested config sections up once instead of on every use.
    feature_param = pretrain_v3_param["feature"]
    fit_param = pretrain_v3_param["fit"]
    machine_types = ["fan", "valve", "slider", "pump"]
    print("\n===========================")

    # Use combinations() to pick the machine types two at a time; each pair
    # becomes one dataset and one model.
    for combo in combinations(machine_types, 2):
        # NOTE: the tuple repr, e.g. "('fan', 'valve')", goes into the file
        # names as-is. It is kept unchanged so existing pickles/models and any
        # other script that reads them keep working.
        combo_ = f"{combo}"

        train_pickle = "{pickle}/pretrain_{combo}.pickle".format(pickle=pretrain_v3_param["pickle_directory"],combo=combo_)

        if os.path.exists(train_pickle):
            train_data = load_pickle(train_pickle)
        else:
            # The file list is only needed when the features must be computed.
            combo_train_files = []
            for machine_type in combo:
                train_files = dataset_generator(pretrain_v3_data_dir, machine_type)
                combo_train_files.extend(train_files)

            if not combo_train_files:
                # Without any audio files there is nothing to extract or
                # train on; skip this pair instead of failing later.
                logger.error("no training files found for {} - skipping".format(combo_))
                continue

            train_data = list_to_vector_array(combo_train_files,
                                              msg="generate train_dataset",
                                              n_mels=feature_param["n_mels"],
                                              frames=feature_param["frames"],
                                              n_fft=feature_param["n_fft"],
                                              hop_length=feature_param["hop_length"],
                                              power=feature_param["power"])
            save_pickle(train_pickle, train_data)

        print("============== MODEL TRAINING ==============")
        model_directory = pretrain_v3_param["model_directory"]
        model_file = "{model}/pretrain_{combo}.h5".format(model=model_directory, combo=combo_)
        # An existing model file is treated as "already trained" and left alone.
        if not os.path.exists(model_file):
            model = keras_model(feature_param["n_mels"] * feature_param["frames"])
            model.summary()
            model.compile(**fit_param["compile"])
            # Autoencoder training: the input is also the reconstruction target.
            model.fit(train_data,
                      train_data,
                      epochs=fit_param["epochs"],
                      batch_size=fit_param["batch_size"],
                      shuffle=fit_param["shuffle"],
                      validation_split=fit_param["validation_split"],
                      verbose=fit_param["verbose"])
            model.save(model_file)



2023-08-26 01:01:15,167 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:15,171 - INFO - train_file num : 40
2023-08-26 01:01:15,172 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:15,174 - INFO - train_file num : 40





generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:03<00:00, 22.67it/s]
2023-08-26 01:01:18,710 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('fan', 'valve').pickle


Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense (Dense)               (None, 64)                20544     
                                                                 
 dense_1 (Dense)             (None, 64)                4160      
                                                                 
 dense_2 (Dense)             (None, 8)                 520       
                                                                 
 dense_3 (Dense)             (None, 64)                576       
                                                                 
 dense_4 (Dense)             (None, 64)                4160      
                                                                 
 dense_5 (Dense)             (None, 320)               20800 

  saving_api.save_model(
2023-08-26 01:01:27,704 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:27,705 - INFO - train_file num : 40
2023-08-26 01:01:27,706 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:27,708 - INFO - train_file num : 40
generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:00<00:00, 81.60it/s]
2023-08-26 01:01:28,696 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('fan', 'slider').pickle


Model: "model_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_2 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense_6 (Dense)             (None, 64)                20544     
                                                                 
 dense_7 (Dense)             (None, 64)                4160      
                                                                 
 dense_8 (Dense)             (None, 8)                 520       
                                                                 
 dense_9 (Dense)             (None, 64)                576       
                                                                 
 dense_10 (Dense)            (None, 64)                4160      
                                                                 
 dense_11 (Dense)            (None, 320)               20800

2023-08-26 01:01:37,270 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:37,271 - INFO - train_file num : 40
2023-08-26 01:01:37,272 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:37,274 - INFO - train_file num : 40
generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:00<00:00, 82.55it/s]
2023-08-26 01:01:38,252 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('fan', 'pump').pickle


Model: "model_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_3 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense_12 (Dense)            (None, 64)                20544     
                                                                 
 dense_13 (Dense)            (None, 64)                4160      
                                                                 
 dense_14 (Dense)            (None, 8)                 520       
                                                                 
 dense_15 (Dense)            (None, 64)                576       
                                                                 
 dense_16 (Dense)            (None, 64)                4160      
                                                                 
 dense_17 (Dense)            (None, 320)               20800

2023-08-26 01:01:46,767 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:46,769 - INFO - train_file num : 40
2023-08-26 01:01:46,770 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:46,772 - INFO - train_file num : 40
generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:00<00:00, 83.21it/s]
2023-08-26 01:01:47,742 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('valve', 'slider').pickle


Model: "model_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_4 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense_18 (Dense)            (None, 64)                20544     
                                                                 
 dense_19 (Dense)            (None, 64)                4160      
                                                                 
 dense_20 (Dense)            (None, 8)                 520       
                                                                 
 dense_21 (Dense)            (None, 64)                576       
                                                                 
 dense_22 (Dense)            (None, 64)                4160      
                                                                 
 dense_23 (Dense)            (None, 320)               20800

2023-08-26 01:01:56,485 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:56,487 - INFO - train_file num : 40
2023-08-26 01:01:56,488 - INFO - target_dir : ../Sample_data
2023-08-26 01:01:56,489 - INFO - train_file num : 40
generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:00<00:00, 81.68it/s]
2023-08-26 01:01:57,478 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('valve', 'pump').pickle


Model: "model_4"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_5 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense_24 (Dense)            (None, 64)                20544     
                                                                 
 dense_25 (Dense)            (None, 64)                4160      
                                                                 
 dense_26 (Dense)            (None, 8)                 520       
                                                                 
 dense_27 (Dense)            (None, 64)                576       
                                                                 
 dense_28 (Dense)            (None, 64)                4160      
                                                                 
 dense_29 (Dense)            (None, 320)               20800

2023-08-26 01:02:06,388 - INFO - target_dir : ../Sample_data
2023-08-26 01:02:06,390 - INFO - train_file num : 40
2023-08-26 01:02:06,391 - INFO - target_dir : ../Sample_data
2023-08-26 01:02:06,393 - INFO - train_file num : 40
generate train_dataset: 100%|██████████████████████████████████████████████████████████| 80/80 [00:00<00:00, 83.35it/s]
2023-08-26 01:02:07,362 - INFO - save_pickle -> ./pickle_pretrain_v3/pretrain_('slider', 'pump').pickle


Model: "model_5"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_6 (InputLayer)        [(None, 320)]             0         
                                                                 
 dense_30 (Dense)            (None, 64)                20544     
                                                                 
 dense_31 (Dense)            (None, 64)                4160      
                                                                 
 dense_32 (Dense)            (None, 8)                 520       
                                                                 
 dense_33 (Dense)            (None, 64)                576       
                                                                 
 dense_34 (Dense)            (None, 64)                4160      
                                                                 
 dense_35 (Dense)            (None, 320)               20800