In [8]:
from audio_preprocessing.cut_audio_segment_from_audio_file import AudioProcessor
from feature_extraction.feature_extractor import FeatureExtractor
from feature_extraction.mfcc_images_extractor import MelSpectrogramImageExtractor
from data_processing.english_data_processing import ModelEvaluator
from itertools import combinations
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import RandomForestClassifier
import pandas as pd

In [9]:
def extract_mfcc_images(n_mfcc, figsize, input_folder, output_folder):
    mfccImageExtractor = MelSpectrogramImageExtractor(n_mfcc, figsize)
    mfccImageExtractor.extract_from_folders(input_folder, output_folder)

In [10]:
def cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, input_folder, output_folder):
    segmentation = AudioProcessor(frame_size, hop_size, threshold)
    segmentation.process_folders(input_folder, output_folder)

In [11]:
def extract_feature(n_mfcc, input_folder, output_folder, selected_features):
    featureExtractor = FeatureExtractor(n_mfcc)
    featureExtractor.process_folder(input_folder, output_folder, selected_features)
    # featureExtractor.process_folder(input_folder, output_folder, ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

In [12]:
def model(featured_data):
    models = [RandomForestClassifier, ExtraTreesClassifier]
    
    df_train_test = pd.read_csv(featured_data)
    df_shuffled = df_train_test.sample(frac=1, random_state=42).reset_index(drop=True)

    modelEvaluator = ModelEvaluator(models)
    best_model, best_scaler, best_avg_acc = modelEvaluator.evaluate_models(df_shuffled)
    return best_model, best_scaler, best_avg_acc

In [13]:
def process_data(frame_size, hop_size, threshold, raw_folder, cutted_folder, n_mfcc_list, featured_data_path, n_mfcc_for_images, images_folder, features):
    cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, raw_folder, cutted_folder)
    n = len(features)

    results = []

    for n_mfcc in n_mfcc_list:
        for r in range(0, n + 1):
            for combo in combinations(range(n), r):
                selected_features = [features[i] for i in range(n) if i not in combo]
                extract_feature(n_mfcc, cutted_folder, featured_data_path, selected_features)
                current_model, current_scaler, current_avg_acc = model(featured_data_path)
                print(f"Scaler: {current_scaler}, Model: {current_model}, n_mfcc: {n_mfcc}, Selected features: {selected_features}, Accuracy: {current_avg_acc}")
                results.append({'Scaler': current_scaler, 'Model': current_model, 'N_MFCC': n_mfcc, 'Selected Features': selected_features, 'Average Accuracy': current_avg_acc})

    results_df = pd.DataFrame(results)
    ranked_results = results_df.sort_values(by='Average Accuracy', ascending=False)

    return ranked_results

In [14]:
process_data(256, 128, 0.0005, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data', 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data0', [13,20,26,40], 'D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv', 100, 'D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/images', ['mfcc','mfcc_statistics', 'zcr', 'pitch', 'rms'])

  return ste / np.max(ste)
[32m2024-05-22 14:25:15.261[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m148[0m - [1mProcessing input folder: D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/cleaned_data0[0m
[32m2024-05-22 14:28:27.663[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 14:28:27.758[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 14:29:34.615[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6168331269094212[0m
[32m2024-05-22 14:29:50.054[0m

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6244680868631823


[32m2024-05-22 14:38:33.550[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 14:38:33.631[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 14:39:30.763[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6231932953513335[0m
[32m2024-05-22 14:39:44.104[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6176504004623896[0m
[32m2024-05-22 14:40:44.531[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6231932953513335


[32m2024-05-22 14:48:04.023[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 14:48:04.058[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 14:48:38.780[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5883865081331021[0m
[32m2024-05-22 14:48:52.820[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5912955990421931[0m
[32m2024-05-22 14:49:35.130[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch', 'rms'], Accuracy: 0.5930222112129468


[32m2024-05-22 14:54:43.140[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 14:54:43.227[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 14:55:51.326[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6221040376517216[0m
[32m2024-05-22 14:56:05.780[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6204683345718769[0m
[32m2024-05-22 14:57:19.389[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6225591610932211


[32m2024-05-22 15:06:37.994[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:06:38.112[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:07:54.742[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6221959375774089[0m
[32m2024-05-22 15:08:11.284[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6210126331434234[0m
[32m2024-05-22 15:09:25.795[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6241955247295847


[32m2024-05-22 15:17:50.752[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:17:50.844[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:18:55.958[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6199243662785897[0m
[32m2024-05-22 15:19:10.352[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6138337874659399[0m
[32m2024-05-22 15:20:22.138[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6222867640987532


[32m2024-05-22 15:27:04.474[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:27:04.500[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:27:28.129[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5281321938733383[0m
[32m2024-05-22 15:27:36.854[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5315838493931138[0m
[32m2024-05-22 15:28:00.450[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch', 'rms'], Accuracy: 0.5324033523243332


[32m2024-05-22 15:31:38.795[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:31:38.869[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:32:38.342[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6266490793493519[0m
[32m2024-05-22 15:32:51.248[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6235566014367104[0m
[32m2024-05-22 15:33:48.438[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6266490793493519


[32m2024-05-22 15:40:36.878[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:40:36.965[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:41:35.588[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6231958550078441[0m
[32m2024-05-22 15:41:48.711[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6171057716125836[0m
[32m2024-05-22 15:42:46.923[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6232858558335398


[32m2024-05-22 15:49:15.674[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:49:15.753[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:50:14.209[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.621832631492032[0m
[32m2024-05-22 15:50:27.318[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6164693254066551[0m
[32m2024-05-22 15:51:24.901[0m | [1mINFO    [0m |

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.621832631492032


[32m2024-05-22 15:57:50.444[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 15:57:50.477[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 15:58:21.101[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5928400627528692[0m
[32m2024-05-22 15:58:30.634[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5986560151928[0m
[32m2024-05-22 15:59:04.306[0m | [1mINFO    [0m | 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch', 'rms'], Accuracy: 0.6036556849145406


[32m2024-05-22 16:02:54.048[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:02:54.079[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:03:23.533[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.590205267938238[0m
[32m2024-05-22 16:03:33.234[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5892043596730245[0m
[32m2024-05-22 16:04:05.057[0m | [1mINFO    [0m |

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'rms'], Accuracy: 0.5932020477252086


[32m2024-05-22 16:08:08.115[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:08:08.151[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:08:38.589[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5867513830402113[0m
[32m2024-05-22 16:08:48.225[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5817513004706466[0m
[32m2024-05-22 16:09:20.544[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr', 'pitch'], Accuracy: 0.5905677483279663


[32m2024-05-22 16:13:40.796[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:13:40.885[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:14:46.744[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6217394930228718[0m
[32m2024-05-22 16:15:00.712[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6187407315663446[0m
[32m2024-05-22 16:16:07.896[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'rms'], Accuracy: 0.6230125505738585


[32m2024-05-22 16:23:42.949[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:23:43.037[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:24:42.645[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6162879200726612[0m
[32m2024-05-22 16:24:57.096[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6149251919742383[0m
[32m2024-05-22 16:25:59.536[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'pitch'], Accuracy: 0.621194203616547


[32m2024-05-22 16:32:41.136[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:32:41.220[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:33:46.249[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6125604822062589[0m
[32m2024-05-22 16:34:00.522[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6128342003137645[0m
[32m2024-05-22 16:35:09.202[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics', 'zcr'], Accuracy: 0.6172875072248368


[32m2024-05-22 16:41:30.367[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:41:30.383[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:41:47.380[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4712360663859302[0m
[32m2024-05-22 16:41:54.521[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4674186276938321[0m
[32m2024-05-22 16:42:12.003[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['pitch', 'rms'], Accuracy: 0.4737799521096524


[32m2024-05-22 16:44:17.283[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:44:17.304[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:44:40.872[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5174958302369747[0m
[32m2024-05-22 16:44:49.943[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5142252497729338[0m
[32m2024-05-22 16:45:12.776[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'rms'], Accuracy: 0.5209515316654281


[32m2024-05-22 16:48:06.700[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:48:06.725[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:48:23.401[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4159817521261663[0m
[32m2024-05-22 16:48:31.189[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.41779803484435635[0m
[32m2024-05-22 16:48:47.990[0m | [1mINFO    [0m

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['zcr', 'pitch'], Accuracy: 0.4241602675253901


[32m2024-05-22 16:51:30.653[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 16:51:30.733[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 16:52:29.768[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6201940384774173[0m
[32m2024-05-22 16:52:43.162[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6197387498967879[0m
[32m2024-05-22 16:53:42.431[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'rms'], Accuracy: 0.6215582528280076


[32m2024-05-22 17:00:05.253[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:00:05.323[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:01:03.650[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6191041202212865[0m
[32m2024-05-22 17:01:17.006[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6194693254066551[0m
[32m2024-05-22 17:02:16.528[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'pitch'], Accuracy: 0.6222848649987613


[32m2024-05-22 17:08:17.818[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:08:17.895[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:09:15.749[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6161065973082323[0m
[32m2024-05-22 17:09:29.241[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6128351085789778[0m
[32m2024-05-22 17:10:27.580[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics', 'zcr'], Accuracy: 0.6181971761208819


[32m2024-05-22 17:16:20.862[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:16:20.893[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:16:52.819[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5834786557674841[0m
[32m2024-05-22 17:17:02.731[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5902959293204525[0m
[32m2024-05-22 17:17:36.546[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'rms'], Accuracy: 0.5902959293204525


[32m2024-05-22 17:21:33.112[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:21:33.139[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:21:59.394[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5842062587730161[0m
[32m2024-05-22 17:22:08.276[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5803881595243994[0m
[32m2024-05-22 17:22:34.473[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'pitch'], Accuracy: 0.5887500619271737


[32m2024-05-22 17:25:39.937[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:25:39.977[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:26:11.603[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5808428701180745[0m
[32m2024-05-22 17:26:21.863[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5705746841714144[0m
[32m2024-05-22 17:26:54.253[0m | [1mINFO    [0m 

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'zcr'], Accuracy: 0.5820251837172818


[32m2024-05-22 17:31:47.909[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:31:47.988[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:32:47.231[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.61546940797622[0m
[32m2024-05-22 17:33:00.337[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6104722153414252[0m
[32m2024-05-22 17:34:01.175[0m | [1mINFO    [0m | 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc', 'mfcc_statistics'], Accuracy: 0.6162873420857073


[32m2024-05-22 17:39:22.823[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:39:22.844[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:39:40.546[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.4274285360416151[0m
[32m2024-05-22 17:39:47.910[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4242483692510941[0m
[32m2024-05-22 17:40:06.382[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['rms'], Accuracy: 0.4302479564032697


[32m2024-05-22 17:42:27.497[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:42:27.510[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:42:41.809[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.21839559078523654[0m
[32m2024-05-22 17:42:49.000[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.21839592106349598[0m
[32m2024-05-22 17:43:03.348[0m | [1mINFO    [0

Scaler: StandardScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['pitch'], Accuracy: 0.21857740896705474


[32m2024-05-22 17:44:28.107[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:44:28.127[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:44:43.090[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.3903502600941293[0m
[32m2024-05-22 17:44:50.294[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.38589587977871354[0m
[32m2024-05-22 17:45:05.266[0m | [1mINFO    [0m

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['zcr'], Accuracy: 0.3918048881182396


[32m2024-05-22 17:47:29.794[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:47:29.875[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:48:30.753[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6101963504252332[0m
[32m2024-05-22 17:48:43.937[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6121984972339196[0m
[32m2024-05-22 17:49:43.444[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 13, Selected features: ['mfcc_statistics'], Accuracy: 0.6125600693584344


[32m2024-05-22 17:55:32.744[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:55:32.767[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-22 17:55:57.769[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5674838576500703[0m
[32m2024-05-22 17:56:05.962[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5711189827429608[0m
[32m2024-05-22 17:56:30.166[0m | [1mINFO    [0m 

Scaler: MaxAbsScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 13, Selected features: ['mfcc'], Accuracy: 0.5755707208323012


[32m2024-05-22 17:58:50.926[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature2.csv[0m
[32m2024-05-22 17:58:50.937[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m


ValueError: at least one array or dtype is required