In [15]:
from audio_preprocessing.cut_audio_segment_from_audio_file import AudioProcessor
from feature_extraction.feature_extractor import FeatureExtractor
from feature_extraction.mfcc_images_extractor import MelSpectrogramImageExtractor
from data_processing.english_data_processing import ModelEvaluator
from itertools import combinations
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import RandomForestClassifier
import pandas as pd

In [16]:
def extract_mfcc_images(n_mfcc, figsize, input_folder, output_folder):
    mfccImageExtractor = MelSpectrogramImageExtractor(n_mfcc, figsize)
    mfccImageExtractor.extract_from_folders(input_folder, output_folder)

In [17]:
def cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, input_folder, output_folder):
    segmentation = AudioProcessor(frame_size, hop_size, threshold)
    segmentation.process_folders(input_folder, output_folder)

In [18]:
def extract_feature(n_mfcc, input_folder, output_folder, selected_features):
    featureExtractor = FeatureExtractor(n_mfcc)
    featureExtractor.process_folder(input_folder, output_folder, selected_features)
    # featureExtractor.process_folder(input_folder, output_folder, ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

In [19]:
def model(featured_data):
    models = [RandomForestClassifier, ExtraTreesClassifier]
    
    df_train_test = pd.read_csv(featured_data)
    df_shuffled = df_train_test.sample(frac=1, random_state=42).reset_index(drop=True)

    modelEvaluator = ModelEvaluator(models)
    best_model, best_scaler, best_avg_acc = modelEvaluator.evaluate_models(df_shuffled)
    return best_model, best_scaler, best_avg_acc

In [20]:
def process_data(frame_size, hop_size, threshold, raw_folder, cutted_folder, n_mfcc_list, featured_data_path, n_mfcc_for_images, images_folder, features):
    cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, raw_folder, cutted_folder)
    n = len(features)

    results = []

    for n_mfcc in n_mfcc_list:
        for r in range(0, n + 1):
            for combo in combinations(range(n), r):
                selected_features = [features[i] for i in range(n) if i not in combo]
                extract_feature(n_mfcc, cutted_folder, featured_data_path, selected_features)
                current_model, current_scaler, current_avg_acc = model(featured_data_path)
                print(f"Scaler: {current_scaler}, Model: {current_model}, n_mfcc: {n_mfcc}, Selected features: {selected_features}, Accuracy: {current_avg_acc}")
                results.append({'Scaler': current_scaler, 'Model': current_model, 'N_MFCC': n_mfcc, 'Selected Features': selected_features, 'Average Accuracy': current_avg_acc})

    results_df = pd.DataFrame(results)
    ranked_results = results_df.sort_values(by='Average Accuracy', ascending=False)

    return ranked_results

In [21]:
process_data(256, 128, 0.005, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data', 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data1', [13,20,26,40], 'D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv', 100, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/images', ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

  return ste / np.max(ste)
[32m2024-05-22 14:57:20.534[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m148[0m - [1mProcessing input folder: D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data1[0m
[32m2024-05-22 15:00:13.179[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:00:13.324[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:01:46.424[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.622307241350838[0m
[32m2024-05-22 15:02:01.453[0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6249448435306746


[32m2024-05-22 15:11:27.743[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:11:27.832[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:12:39.313[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.620762612501032[0m
[32m2024-05-22 15:12:55.217[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6158552555528033[0m
[32m2024-05-22 15:14:03.683[0m | [1mINFO    [0m |

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6256724465362068


[32m2024-05-22 15:20:52.184[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:20:52.217[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:21:21.735[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5923115349682109[0m
[32m2024-05-22 15:21:30.882[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5926749236231525[0m
[32m2024-05-22 15:22:00.797[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch', 'rms'], Accuracy: 0.5964918668978614


[32m2024-05-22 15:26:41.566[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:26:41.672[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:27:51.369[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6196719511188176[0m
[32m2024-05-22 15:28:05.611[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6220340186607217[0m
[32m2024-05-22 15:29:14.420[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6253074064899679


[32m2024-05-22 15:36:58.051[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:36:58.165[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:38:08.022[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6214897200891751[0m
[32m2024-05-22 15:38:23.090[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6193994715547848[0m
[32m2024-05-22 15:39:29.326[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6231268268516226


[32m2024-05-22 15:46:45.026[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:46:45.132[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:47:54.589[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6163089753117001[0m
[32m2024-05-22 15:48:09.024[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6179450912393692[0m
[32m2024-05-22 15:49:18.792[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6227619519445132


[32m2024-05-22 15:55:34.271[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 15:55:34.298[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:55:58.483[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5198614482701677[0m
[32m2024-05-22 15:56:07.406[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.524315993724713[0m
[32m2024-05-22 15:56:31.654[0m | [1mINFO    [0m |

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch', 'rms'], Accuracy: 0.5284081413590951


[32m2024-05-22 16:00:03.522[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:00:03.615[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:01:05.553[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6195811245974733[0m
[32m2024-05-22 16:01:18.668[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6246723639666418[0m
[32m2024-05-22 16:02:18.859[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6246723639666418


[32m2024-05-22 16:08:24.888[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:08:24.969[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:09:25.833[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6186728593840309[0m
[32m2024-05-22 16:09:40.108[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6162179836512262[0m
[32m2024-05-22 16:10:43.536[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6211266617124929


[32m2024-05-22 16:16:58.758[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:16:58.835[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:17:57.695[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6204897200891751[0m
[32m2024-05-22 16:18:11.503[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.618670547436215[0m
[32m2024-05-22 16:19:13.579[0m | [1mINFO    [0m |

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6204897200891751


[32m2024-05-22 16:25:34.494[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:25:34.526[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:26:05.938[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5931274874081414[0m
[32m2024-05-22 16:26:15.621[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5974017009330361[0m
[32m2024-05-22 16:26:47.981[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch', 'rms'], Accuracy: 0.5974017009330361


[32m2024-05-22 16:30:35.187[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:30:35.222[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:31:04.608[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5862205433077368[0m
[32m2024-05-22 16:31:13.650[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5856746759144579[0m
[32m2024-05-22 16:31:45.650[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'rms'], Accuracy: 0.5883112046899512


[32m2024-05-22 16:35:41.620[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:35:41.653[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:36:10.573[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5851293865081331[0m
[32m2024-05-22 16:36:19.594[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.58594748575675[0m
[32m2024-05-22 16:36:48.749[0m | [1mINFO    [0m | 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch'], Accuracy: 0.5865841796713731


[32m2024-05-22 16:40:51.494[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:40:51.579[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:41:57.641[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6188547601354142[0m
[32m2024-05-22 16:42:11.337[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6183088101725704[0m
[32m2024-05-22 16:43:16.318[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'rms'], Accuracy: 0.6189453389480637


[32m2024-05-22 16:50:32.172[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:50:32.253[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:51:34.359[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6151268268516226[0m
[32m2024-05-22 16:51:47.382[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6194900503674345[0m
[32m2024-05-22 16:52:45.970[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch'], Accuracy: 0.6201260837255387


[32m2024-05-22 16:59:08.903[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 16:59:08.996[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:00:17.744[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6190353397737594[0m
[32m2024-05-22 17:00:31.565[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6139440178350261[0m
[32m2024-05-22 17:01:36.341[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr'], Accuracy: 0.6193080670464867


[32m2024-05-22 17:07:49.218[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:07:49.235[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:08:07.999[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4661403682602593[0m
[32m2024-05-22 17:08:15.686[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4614152423416729[0m
[32m2024-05-22 17:08:33.096[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['pitch', 'rms'], Accuracy: 0.46823334159028984


[32m2024-05-22 17:10:33.748[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:10:33.765[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:10:56.620[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.499135826934192[0m
[32m2024-05-22 17:11:04.816[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5039540087523738[0m
[32m2024-05-22 17:11:27.404[0m | [1mINFO    [0m |

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'rms'], Accuracy: 0.5061356617950623


[32m2024-05-22 17:14:21.208[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:14:21.226[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:14:36.416[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4071442490298076[0m
[32m2024-05-22 17:14:43.465[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.39859978531913137[0m
[32m2024-05-22 17:14:58.809[0m | [1mINFO    [0m

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch'], Accuracy: 0.4071442490298076


[32m2024-05-22 17:17:32.987[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:17:33.068[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:18:36.233[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6193080670464867[0m
[32m2024-05-22 17:18:50.215[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6193998018330443[0m
[32m2024-05-22 17:19:49.191[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'rms'], Accuracy: 0.6210355874824539


[32m2024-05-22 17:26:01.487[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:26:01.571[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:27:05.760[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6233991412765255[0m
[32m2024-05-22 17:27:20.566[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6173087276030056[0m
[32m2024-05-22 17:28:24.303[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch'], Accuracy: 0.6233991412765255


[32m2024-05-22 17:35:05.577[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:35:05.655[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:36:03.637[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6125813723061679[0m
[32m2024-05-22 17:36:16.636[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6124919494674262[0m
[32m2024-05-22 17:37:14.172[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr'], Accuracy: 0.6167625299314673


[32m2024-05-22 17:42:55.903[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:42:55.936[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:43:29.496[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5803121129551647[0m
[32m2024-05-22 17:43:39.378[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5826746759144579[0m
[32m2024-05-22 17:44:13.532[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'rms'], Accuracy: 0.586492775163075


[32m2024-05-22 17:48:02.511[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:48:02.549[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:48:25.982[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5861299644950873[0m
[32m2024-05-22 17:48:33.938[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5847652547271076[0m
[32m2024-05-22 17:48:57.542[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch'], Accuracy: 0.588492114606556


[32m2024-05-22 17:51:59.658[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:51:59.689[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:52:31.575[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5779478160350094[0m
[32m2024-05-22 17:52:40.740[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5742214515729502[0m
[32m2024-05-22 17:53:10.430[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr'], Accuracy: 0.5794931880108992


[32m2024-05-22 17:57:07.625[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 17:57:07.708[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:58:04.943[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6068545949962845[0m
[32m2024-05-22 17:58:17.796[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.611762695070597[0m
[32m2024-05-22 17:59:15.640[0m | [1mINFO    [0m |

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics'], Accuracy: 0.6171252580298902


[32m2024-05-22 18:04:18.952[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:04:18.966[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:04:36.454[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.41823507555115186[0m
[32m2024-05-22 18:04:43.319[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.41669052927091077[0m
[32m2024-05-22 18:05:00.716[0m | [1mINFO    [0

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['rms'], Accuracy: 0.4205068119891008


[32m2024-05-22 18:07:11.411[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:07:11.423[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:07:24.028[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.21361613409297334[0m
[32m2024-05-22 18:07:30.193[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.2142527454380315[0m
[32m2024-05-22 18:07:42.876[0m | [1mINFO    [0m

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['pitch'], Accuracy: 0.2155254727107588


[32m2024-05-22 18:08:57.264[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:08:57.279[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:09:11.921[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.3706927586491619[0m
[32m2024-05-22 18:09:18.958[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.3606028403930311[0m
[32m2024-05-22 18:09:33.623[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr'], Accuracy: 0.3706927586491619


[32m2024-05-22 18:11:52.812[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:11:52.884[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:12:49.508[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.610672941953596[0m
[32m2024-05-22 18:13:01.862[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6149447609611097[0m
[32m2024-05-22 18:13:58.798[0m | [1mINFO    [0m |

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics'], Accuracy: 0.6168545949962844


[32m2024-05-22 18:19:24.559[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:19:24.579[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 18:19:47.667[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5682209561555611[0m
[32m2024-05-22 18:19:55.401[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5710388902650483[0m
[32m2024-05-22 18:20:18.495[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc'], Accuracy: 0.5717660804227562


[32m2024-05-22 18:22:34.835[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature3.csv[0m
[32m2024-05-22 18:22:34.845[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m


ValueError: at least one array or dtype is required