In [1]:
from audio_preprocessing.cut_audio_segment_from_audio_file import AudioProcessor
from feature_extraction.feature_extractor import FeatureExtractor
from feature_extraction.mfcc_images_extractor import MelSpectrogramImageExtractor
from data_processing.english_data_processing import ModelEvaluator
from itertools import combinations
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import RandomForestClassifier
import pandas as pd

In [2]:
def extract_mfcc_images(n_mfcc, figsize, input_folder, output_folder):
    mfccImageExtractor = MelSpectrogramImageExtractor(n_mfcc, figsize)
    mfccImageExtractor.extract_from_folders(input_folder, output_folder)

In [3]:
def cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, input_folder, output_folder):
    segmentation = AudioProcessor(frame_size, hop_size, threshold)
    segmentation.process_folders(input_folder, output_folder)

In [4]:
def extract_feature(n_mfcc, input_folder, output_folder, selected_features):
    featureExtractor = FeatureExtractor(n_mfcc)
    featureExtractor.process_folder(input_folder, output_folder, selected_features)
    # featureExtractor.process_folder(input_folder, output_folder, ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

In [5]:
def model(featured_data):
    models = [RandomForestClassifier, ExtraTreesClassifier]
    
    df_train_test = pd.read_csv(featured_data)
    df_shuffled = df_train_test.sample(frac=1, random_state=42).reset_index(drop=True)

    modelEvaluator = ModelEvaluator(models)
    best_model, best_scaler, best_avg_acc = modelEvaluator.evaluate_models(df_shuffled)
    return best_model, best_scaler, best_avg_acc

In [6]:
def process_data(frame_size, hop_size, threshold, raw_folder, cutted_folder, n_mfcc_list, featured_data_path, n_mfcc_for_images, images_folder, features):
    cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, raw_folder, cutted_folder)
    n = len(features)

    results = []

    for n_mfcc in n_mfcc_list:
        for r in range(0, n + 1):
            for combo in combinations(range(n), r):
                selected_features = [features[i] for i in range(n) if i not in combo]
                extract_feature(n_mfcc, cutted_folder, featured_data_path, selected_features)
                current_model, current_scaler, current_avg_acc = model(featured_data_path)
                print(f"Scaler: {current_scaler}, Model: {current_model}, n_mfcc: {n_mfcc}, Selected features: {selected_features}, Accuracy: {current_avg_acc}")
                results.append({'Scaler': current_scaler, 'Model': current_model, 'N_MFCC': n_mfcc, 'Selected Features': selected_features, 'Average Accuracy': current_avg_acc})

    results_df = pd.DataFrame(results)
    ranked_results = results_df.sort_values(by='Average Accuracy', ascending=False)

    return ranked_results

In [7]:
process_data(256, 128, 0.015, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data', 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data3', [13,20,26,40], 'D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv', 100, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/images', ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

  return ste / np.max(ste)
[32m2024-05-22 15:11:13.167[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m148[0m - [1mProcessing input folder: D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data3[0m
[32m2024-05-22 15:13:58.017[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:13:58.120[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:15:11.932[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6136714781279886[0m
[32m2024-05-22 15:15:28.667[0m

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6198600814451289


[32m2024-05-22 15:23:42.566[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:23:42.650[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:24:39.230[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6107583313858767[0m
[32m2024-05-22 15:24:52.512[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.618128916667081[0m
[32m2024-05-22 15:25:57.241[0m | [1mINFO    [0m |

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.618128916667081


[32m2024-05-22 15:32:34.102[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:32:34.134[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:33:02.279[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5910089649308612[0m
[32m2024-05-22 15:33:11.027[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5961060808716652[0m
[32m2024-05-22 15:33:39.622[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch', 'rms'], Accuracy: 0.5961060808716652


[32m2024-05-22 15:38:16.953[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:38:17.045[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:39:22.857[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6148536258330557[0m
[32m2024-05-22 15:39:37.674[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6156720549066794[0m
[32m2024-05-22 15:40:45.166[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6184025550633049


[32m2024-05-22 15:47:42.399[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:47:42.490[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:48:48.822[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6106684168916601[0m
[32m2024-05-22 15:49:03.746[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6158532098231377[0m
[32m2024-05-22 15:50:08.741[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6158532098231377


[32m2024-05-22 15:57:13.192[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 15:57:13.285[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:58:18.881[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6095756035872983[0m
[32m2024-05-22 15:58:33.251[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6134882514489907[0m
[32m2024-05-22 15:59:42.021[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6143081721916431


[32m2024-05-22 16:05:58.885[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:05:58.913[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:06:21.450[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5095553831849123[0m
[32m2024-05-22 16:06:29.414[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5121949744013021[0m
[32m2024-05-22 16:06:51.962[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch', 'rms'], Accuracy: 0.5158357241473039


[32m2024-05-22 16:10:19.897[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:10:19.983[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:11:22.554[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6118505645967274[0m
[32m2024-05-22 16:11:36.383[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6133043618059802[0m
[32m2024-05-22 16:12:35.033[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6174013136631911


[32m2024-05-22 16:18:31.696[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:18:31.783[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:19:34.015[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6090293212408697[0m
[32m2024-05-22 16:19:48.463[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6153092478507535[0m
[32m2024-05-22 16:20:50.507[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6163106549918703


[32m2024-05-22 16:27:02.597[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:27:02.670[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:28:00.207[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6108487431031024[0m
[32m2024-05-22 16:28:14.570[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6073005597073676[0m
[32m2024-05-22 16:29:16.842[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6146714764705784


[32m2024-05-22 16:35:23.628[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:35:23.660[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:35:54.454[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5858209400498218[0m
[32m2024-05-22 16:36:03.355[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5944680625373954[0m
[32m2024-05-22 16:36:33.403[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch', 'rms'], Accuracy: 0.5947417009336191


[32m2024-05-22 16:40:05.505[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:40:05.542[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:40:37.277[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5839996121660526[0m
[32m2024-05-22 16:40:47.281[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.584731690177028[0m
[32m2024-05-22 16:41:17.563[0m | [1mINFO    [0m |

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'rms'], Accuracy: 0.5870953226231497


[32m2024-05-22 16:44:59.917[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:44:59.952[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:45:28.776[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5813620927122023[0m
[32m2024-05-22 16:45:37.857[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5836385453906597[0m
[32m2024-05-22 16:46:06.386[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch'], Accuracy: 0.5862771421610306


[32m2024-05-22 16:50:09.722[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:50:09.828[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:51:18.226[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6108492403261121[0m
[32m2024-05-22 16:51:33.331[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6104849416011575[0m
[32m2024-05-22 16:52:37.171[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'rms'], Accuracy: 0.6153999910499859


[32m2024-05-22 16:59:40.102[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 16:59:40.187[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:00:38.926[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.606208906590028[0m
[32m2024-05-22 17:00:51.777[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6104865990111893[0m
[32m2024-05-22 17:01:49.436[0m | [1mINFO    [0m |

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch'], Accuracy: 0.61166841523425


[32m2024-05-22 17:08:05.507[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:08:05.603[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:09:08.985[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6069364267234164[0m
[32m2024-05-22 17:09:23.051[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6120317195131856[0m
[32m2024-05-22 17:10:26.243[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr'], Accuracy: 0.6120317195131856


[32m2024-05-22 17:16:27.904[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:16:27.920[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:16:45.540[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4655983830307731[0m
[32m2024-05-22 17:16:53.180[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4642340859632287[0m
[32m2024-05-22 17:17:12.590[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['pitch', 'rms'], Accuracy: 0.4655983830307731


[32m2024-05-22 17:19:20.670[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:19:20.688[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:19:43.284[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.49417494957329977[0m
[32m2024-05-22 17:19:51.625[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4937187474620909[0m
[32m2024-05-22 17:20:14.451[0m | [1mINFO    [0m

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'rms'], Accuracy: 0.4969044552839061


[32m2024-05-22 17:23:07.247[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:23:07.266[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:23:22.625[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.3754109133820943[0m
[32m2024-05-22 17:23:29.795[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.3760475245752473[0m
[32m2024-05-22 17:23:45.250[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch'], Accuracy: 0.3760475245752473


[32m2024-05-22 17:26:16.824[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:26:16.908[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:27:19.888[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6099398194417511[0m
[32m2024-05-22 17:27:34.324[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6122151119331866[0m
[32m2024-05-22 17:28:36.618[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'rms'], Accuracy: 0.6132153588872813


[32m2024-05-22 17:35:21.158[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:35:21.232[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:36:18.285[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6089378322071232[0m
[32m2024-05-22 17:36:31.257[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6131242842060426[0m
[32m2024-05-22 17:37:28.409[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch'], Accuracy: 0.6151275128407843


[32m2024-05-22 17:43:09.192[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:43:09.280[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:44:11.062[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6068446890781651[0m
[32m2024-05-22 17:44:25.704[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6153089163687472[0m
[32m2024-05-22 17:45:21.696[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr'], Accuracy: 0.6153089163687472


[32m2024-05-22 17:50:58.967[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:50:59.001[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:51:30.783[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5759920013391873[0m
[32m2024-05-22 17:51:40.856[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5805443266025911[0m
[32m2024-05-22 17:52:14.394[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'rms'], Accuracy: 0.5849111876834546


[32m2024-05-22 17:55:54.079[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:55:54.103[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:56:17.474[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5803630059451297[0m
[32m2024-05-22 17:56:25.434[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5832739980542007[0m
[32m2024-05-22 17:56:48.736[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch'], Accuracy: 0.5840938359263513


[32m2024-05-22 17:59:41.151[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 17:59:41.181[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:00:09.168[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5716250573878224[0m
[32m2024-05-22 18:00:17.942[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5733550619788481[0m
[32m2024-05-22 18:00:46.046[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr'], Accuracy: 0.5766308500358829


[32m2024-05-22 18:04:34.233[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:04:34.316[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:05:29.808[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5976531073951978[0m
[32m2024-05-22 18:05:42.373[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6076649413028237[0m
[32m2024-05-22 18:06:38.204[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics'], Accuracy: 0.609028078183346


[32m2024-05-22 18:11:34.280[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:11:34.299[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:11:52.039[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4204598152650779[0m
[32m2024-05-22 18:11:58.939[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4149071601770776[0m
[32m2024-05-22 18:12:16.648[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['rms'], Accuracy: 0.4204598152650779


[32m2024-05-22 18:14:23.522[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:14:23.534[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:14:36.063[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.20768093530962908[0m
[32m2024-05-22 18:14:42.171[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.20731721667818565[0m
[32m2024-05-22 18:14:54.677[0m | [1mINFO    [0

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['pitch'], Accuracy: 0.20822738339706076


[32m2024-05-22 18:16:07.723[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:16:07.737[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:16:22.435[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.3387346668854448[0m
[32m2024-05-22 18:16:29.545[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.33136325289922447[0m
[32m2024-05-22 18:16:44.276[0m | [1mINFO    [0m

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr'], Accuracy: 0.34001037538679807


[32m2024-05-22 18:19:02.821[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:19:02.894[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:19:59.135[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6053893173293821[0m
[32m2024-05-22 18:20:11.647[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6074812174008164[0m
[32m2024-05-22 18:21:07.295[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics'], Accuracy: 0.6090293212408697


[32m2024-05-22 18:26:28.376[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:26:28.398[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:26:51.659[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5601576031199086[0m
[32m2024-05-22 18:26:59.669[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.566891825819465[0m
[32m2024-05-22 18:27:22.981[0m | [1mINFO    [0m |

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc'], Accuracy: 0.5694402594841146


[32m2024-05-22 18:29:39.631[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature4.csv[0m
[32m2024-05-22 18:29:39.642[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m


ValueError: at least one array or dtype is required