In [1]:
from audio_preprocessing.cut_audio_segment_from_audio_file import AudioProcessor
from feature_extraction.feature_extractor import FeatureExtractor
from feature_extraction.mfcc_images_extractor import MelSpectrogramImageExtractor
from data_processing.english_data_processing import ModelEvaluator
from itertools import combinations
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import RandomForestClassifier
import pandas as pd

In [2]:
def extract_mfcc_images(n_mfcc, figsize, input_folder, output_folder):
    """Run the mel-spectrogram image extractor over a folder.

    Builds a ``MelSpectrogramImageExtractor`` from ``n_mfcc`` and ``figsize``
    and asks it to process ``input_folder`` into ``output_folder``.

    Args:
        n_mfcc: First constructor argument of the extractor.
        figsize: Second constructor argument of the extractor.
        input_folder: Folder handed to ``extract_from_folders`` as the source.
        output_folder: Folder handed to ``extract_from_folders`` as the target.

    Returns:
        None. Whatever ``extract_from_folders`` returns is discarded.
    """
    MelSpectrogramImageExtractor(n_mfcc, figsize).extract_from_folders(
        input_folder, output_folder
    )

In [3]:
def cut_audio_segment_from_audio_file(frame_size, hop_size, threshold, input_folder, output_folder):
    """Run the audio segmentation step over a folder.

    Builds an ``AudioProcessor`` from ``frame_size``, ``hop_size`` and
    ``threshold`` and asks it to process ``input_folder`` into
    ``output_folder``.

    Args:
        frame_size: First constructor argument of ``AudioProcessor``.
        hop_size: Second constructor argument of ``AudioProcessor``.
        threshold: Third constructor argument of ``AudioProcessor``.
        input_folder: Folder handed to ``process_folders`` as the source.
        output_folder: Folder handed to ``process_folders`` as the target.

    Returns:
        None. Whatever ``process_folders`` returns is discarded.
    """
    AudioProcessor(frame_size, hop_size, threshold).process_folders(
        input_folder, output_folder
    )

In [4]:
def extract_feature(n_mfcc, input_folder, output_folder, selected_features):
    """Extract the requested features from a folder.

    Builds a ``FeatureExtractor`` from ``n_mfcc`` and calls its
    ``process_folder`` with the two paths and the feature selection.

    Args:
        n_mfcc: Constructor argument of ``FeatureExtractor``.
        input_folder: First argument forwarded to ``process_folder``.
        output_folder: Second argument forwarded to ``process_folder``
            (the notebook passes a CSV file path here).
        selected_features: Feature names forwarded to ``process_folder``.
            Names used elsewhere in this notebook: 'mfcc',
            'mfcc_statistics', 'zcr', 'pitch', 'rms'.

    Returns:
        None. Whatever ``process_folder`` returns is discarded.
    """
    FeatureExtractor(n_mfcc).process_folder(
        input_folder, output_folder, selected_features
    )

In [5]:
def model(featured_data):
    """Pick the best classifier/scaler pair for a feature CSV.

    Args:
        featured_data: Path (or anything ``pd.read_csv`` accepts) of the
            feature table to evaluate.

    Returns:
        The 3-tuple ``(best_model, best_scaler, best_avg_acc)`` unpacked from
        ``ModelEvaluator.evaluate_models``.
    """
    candidate_classifiers = [RandomForestClassifier, ExtraTreesClassifier]

    # frac=1 with a fixed seed gives a reproducible full shuffle; the index
    # is renumbered so it no longer reflects the original row order.
    shuffled_frame = (
        pd.read_csv(featured_data)
        .sample(frac=1, random_state=42)
        .reset_index(drop=True)
    )

    evaluator = ModelEvaluator(candidate_classifiers)
    winner, winner_scaler, winner_accuracy = evaluator.evaluate_models(shuffled_frame)
    return winner, winner_scaler, winner_accuracy

In [6]:
def process_data(
    frame_size,
    hop_size,
    threshold,
    raw_folder,
    cutted_folder,
    n_mfcc_list,
    featured_data_path,
    n_mfcc_for_images,
    images_folder,
    features,
):
    """Evaluate every non-empty subset of ``features`` per MFCC count and rank the runs.

    For each ``n_mfcc`` and each non-empty subset of ``features`` (original
    order kept within a subset), the features are re-extracted from
    ``cutted_folder`` into ``featured_data_path`` and then scored via
    ``model``. Each run is printed and collected into the result table.

    Args:
        frame_size: Not read by this function body.
        hop_size: Not read by this function body.
        threshold: Not read by this function body.
        raw_folder: Not read by this function body.
        cutted_folder: Input folder handed to ``extract_feature``.
        n_mfcc_list: Iterable of MFCC counts to sweep.
        featured_data_path: File that ``extract_feature`` writes and ``model``
            reads; it is overwritten on every run.
        n_mfcc_for_images: Not read by this function body.
        images_folder: Not read by this function body.
        features: Sequence of feature names to take subsets of.

    Returns:
        pandas.DataFrame with columns ``Scaler``, ``Model``, ``N_MFCC``,
        ``Selected Features`` and ``Average Accuracy``, sorted by
        ``Average Accuracy`` descending. If no run was executed (empty
        ``n_mfcc_list`` or empty ``features``) the frame is empty but still
        has these columns.
    """
    result_columns = ['Scaler', 'Model', 'N_MFCC', 'Selected Features', 'Average Accuracy']
    n = len(features)
    results = []

    for n_mfcc in n_mfcc_list:
        # r is the number of features left out; stopping at n - 1 guarantees
        # that at least one feature is always selected.
        for r in range(0, n):
            for combo in combinations(range(n), r):
                excluded = set(combo)
                selected_features = [
                    feature for i, feature in enumerate(features) if i not in excluded
                ]
                print(selected_features)
                extract_feature(n_mfcc, cutted_folder, featured_data_path, selected_features)
                current_model, current_scaler, current_avg_acc = model(featured_data_path)
                print(f"Scaler: {current_scaler}, Model: {current_model}, n_mfcc: {n_mfcc}, Selected features: {selected_features}, Accuracy: {current_avg_acc}")
                results.append({'Scaler': current_scaler, 'Model': current_model, 'N_MFCC': n_mfcc, 'Selected Features': selected_features, 'Average Accuracy': current_avg_acc})

    # Explicit columns keep the sort key present even when ``results`` is
    # empty; without them sort_values raises KeyError on an empty sweep.
    results_df = pd.DataFrame(results, columns=result_columns)
    ranked_results = results_df.sort_values(by='Average Accuracy', ascending=False)

    return ranked_results

In [7]:
# Feature names seen in this notebook: 'mfcc', 'mfcc_statistics', 'zcr', 'pitch', 'rms'
# ('mfcc' is left out of this run). The same folder is passed as both
# raw_folder and cutted_folder.
ranked_results = process_data(
    frame_size=256,
    hop_size=128,
    threshold=0.001,
    raw_folder='D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data',
    cutted_folder='D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data',
    n_mfcc_list=[26],
    featured_data_path='D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv',
    n_mfcc_for_images=100,
    images_folder='D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/images',
    features=['mfcc_statistics', 'zcr', 'pitch', 'rms'],
)

[32m2024-05-23 03:23:18.530[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m148[0m - [1mProcessing input folder: D:/data_analysis/speech_emotion_recognition/data/EnglishDataset/combined_data[0m


['mfcc_statistics', 'zcr', 'pitch', 'rms']


[32m2024-05-23 03:25:48.685[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 03:25:48.889[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 03:27:18.363[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.633006244424621[0m
[32m2024-05-23 03:27:36.305[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6339875111507582[0m
[32m2024-05-23 03:29:05.464[0m | [1mINFO    [0m |

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'zcr', 'pitch', 'rms'], Accuracy: 0.6372881355932203
['zcr', 'pitch', 'rms']


[32m2024-05-23 03:39:02.398[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 03:39:02.424[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 03:39:34.662[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5272078501338091[0m
[32m2024-05-23 03:39:45.391[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5254237288135594[0m
[32m2024-05-23 03:40:10.145[0m | [1mINFO    [0m 

Scaler: MinMaxScaler, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 26, Selected features: ['zcr', 'pitch', 'rms'], Accuracy: 0.5304192685102587
['mfcc_statistics', 'pitch', 'rms']


[32m2024-05-23 03:44:51.996[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 03:44:52.132[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 03:46:29.084[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6351471900089206[0m
[32m2024-05-23 03:46:51.707[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6300624442462087[0m
[32m2024-05-23 03:48:48.095[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'pitch', 'rms'], Accuracy: 0.6351471900089206
['mfcc_statistics', 'zcr', 'rms']


[32m2024-05-23 03:58:41.952[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 03:58:42.093[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:00:08.937[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.631757359500446[0m
[32m2024-05-23 04:00:25.460[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6276538804638716[0m
[32m2024-05-23 04:01:56.237[0m | [1mINFO    [0m |

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'zcr', 'rms'], Accuracy: 0.6337198929527207
['mfcc_statistics', 'zcr', 'pitch']


[32m2024-05-23 04:10:24.417[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:10:24.566[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:11:50.934[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6300624442462087[0m
[32m2024-05-23 04:12:07.009[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.627029438001784[0m
[32m2024-05-23 04:13:33.819[0m | [1mINFO    [0m |

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'zcr', 'pitch'], Accuracy: 0.6347011596788581
['pitch', 'rms']


[32m2024-05-23 04:21:19.983[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:21:19.998[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:21:38.367[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.47047279214986626[0m
[32m2024-05-23 04:21:45.381[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4732381801962534[0m
[32m2024-05-23 04:22:03.994[0m | [1mINFO    [0m

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 26, Selected features: ['pitch', 'rms'], Accuracy: 0.4732381801962534
['zcr', 'rms']


[32m2024-05-23 04:24:12.380[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:24:12.409[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:24:36.495[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.5101694915254237[0m
[32m2024-05-23 04:24:44.815[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.5159678858162355[0m
[32m2024-05-23 04:25:09.287[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.ExtraTreesClassifier'>, n_mfcc: 26, Selected features: ['zcr', 'rms'], Accuracy: 0.5159678858162355
['zcr', 'pitch']


[32m2024-05-23 04:28:09.703[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:28:09.719[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:28:26.070[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.41757359500446034[0m
[32m2024-05-23 04:28:33.246[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4159678858162355[0m
[32m2024-05-23 04:28:49.558[0m | [1mINFO    [0m

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['zcr', 'pitch'], Accuracy: 0.41757359500446034
['mfcc_statistics', 'rms']


[32m2024-05-23 04:31:31.186[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:31:31.322[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:32:59.494[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6265834076717216[0m
[32m2024-05-23 04:33:15.795[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6275646743978591[0m
[32m2024-05-23 04:34:43.473[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'rms'], Accuracy: 0.6304192685102586
['mfcc_statistics', 'pitch']


[32m2024-05-23 04:43:08.632[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:43:08.770[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:44:35.860[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6316681534344336[0m
[32m2024-05-23 04:44:51.916[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6248884924174843[0m
[32m2024-05-23 04:46:18.352[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'pitch'], Accuracy: 0.6316681534344336
['mfcc_statistics', 'zcr']


[32m2024-05-23 04:54:21.357[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 04:54:21.486[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 04:55:48.669[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6275646743978591[0m
[32m2024-05-23 04:56:04.997[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.6199821587867975[0m
[32m2024-05-23 04:57:31.623[0m | [1mINFO    [0m 

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics', 'zcr'], Accuracy: 0.6275646743978591
['rms']


[32m2024-05-23 05:04:49.355[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 05:04:49.370[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 05:05:08.468[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.42506690454950935[0m
[32m2024-05-23 05:05:15.883[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.4248884924174844[0m
[32m2024-05-23 05:05:35.923[0m | [1mINFO    [0m

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['rms'], Accuracy: 0.4293487957181089
['pitch']


[32m2024-05-23 05:08:04.315[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 05:08:04.326[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 05:08:17.783[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.21097234611953614[0m
[32m2024-05-23 05:08:24.272[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.20856378233719894[0m
[32m2024-05-23 05:08:37.702[0m | [1mINFO    [0

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['pitch'], Accuracy: 0.21097234611953614
['zcr']


[32m2024-05-23 05:09:56.907[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 05:09:56.922[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 05:10:12.500[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.3868867082961641[0m
[32m2024-05-23 05:10:19.709[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.3813559322033898[0m
[32m2024-05-23 05:10:35.262[0m | [1mINFO    [0m 

Scaler: RobustScaler, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['zcr'], Accuracy: 0.3870651204281891
['mfcc_statistics']


[32m2024-05-23 05:13:06.933[0m | [1mINFO    [0m | [36mfeature_extraction.feature_extractor[0m:[36mprocess_folder[0m:[36m158[0m - [1mFeature extraction completed. Data saved to: D:/data_analysis/speech_emotion_recognition/notebooks/feature1.csv[0m
[32m2024-05-23 05:13:07.066[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m53[0m - [1mFinding best model....[0m
[32m2024-05-23 05:14:34.635[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.RandomForestClassifier'> - scaler: None, accuracy: 0.6264942016057091[0m
[32m2024-05-23 05:14:50.879[0m | [1mINFO    [0m | [36mdata_processing.english_data_processing[0m:[36mevaluate_models[0m:[36m74[0m - [1mModel <class 'sklearn.ensemble._forest.ExtraTreesClassifier'> - scaler: None, accuracy: 0.623728813559322[0m
[32m2024-05-23 05:16:26.213[0m | [1mINFO    [0m |

Scaler: None, Model: <class 'sklearn.ensemble._forest.RandomForestClassifier'>, n_mfcc: 26, Selected features: ['mfcc_statistics'], Accuracy: 0.6264942016057091


In [11]:
# Display the top rows (at most 30) of the ranking, best average accuracy first.
ranked_results.head(n=30)

Unnamed: 0,Scaler,Model,N_MFCC,Selected Features,Average Accuracy
0,RobustScaler,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, zcr, pitch, rms]",0.637288
2,,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, pitch, rms]",0.635147
4,RobustScaler,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, zcr, pitch]",0.634701
3,RobustScaler,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, zcr, rms]",0.63372
9,,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, pitch]",0.631668
8,RobustScaler,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, rms]",0.630419
10,,<class 'sklearn.ensemble._forest.RandomForestC...,26,"[mfcc_statistics, zcr]",0.627565
14,,<class 'sklearn.ensemble._forest.RandomForestC...,26,[mfcc_statistics],0.626494
1,MinMaxScaler,<class 'sklearn.ensemble._forest.ExtraTreesCla...,26,"[zcr, pitch, rms]",0.530419
6,,<class 'sklearn.ensemble._forest.ExtraTreesCla...,26,"[zcr, rms]",0.515968
