In [1]:
from config.vi_config import VietnameseDatasetConfig
from config.eng_config import Config
from src.data_preparation_runner import DataPreparationRunner
from src.data_preprocessing_runner import DataPreprocessingRunner
from src.feature_extraction_runner import FeatureExtractionRunner
from src.mel_spectrogram_extraction_runner import MelSpectrogramExtractionRunner

In [2]:
class AudioFeaturePipeline:
    """Runs the audio processing stages one after another.

    One runner per stage is created up front from a single shared
    configuration object: data preparation, data preprocessing, feature
    extraction, and Mel-spectrogram extraction.
    """

    def __init__(self, config):
        """Create one runner per stage, each built from ``config``.

        Args:
            config: Configuration object; stored on the instance and passed
                unchanged to every runner constructor.
        """
        self.config = config
        # Runners are constructed in the same order in which ``run`` calls them.
        self.data_preparation_runner = DataPreparationRunner(config)
        self.data_preprocessing_runner = DataPreprocessingRunner(config)
        self.feature_extraction_runner = FeatureExtractionRunner(config)
        self.mel_spectrogram_extraction_runner = MelSpectrogramExtractionRunner(config)

    def run(self):
        """Call ``run()`` on each stage runner, in pipeline order.

        Any exception raised by a stage propagates to the caller, so the
        stages after it are not executed.
        """
        stage_attributes = (
            "data_preparation_runner",
            "data_preprocessing_runner",
            "feature_extraction_runner",
            "mel_spectrogram_extraction_runner",
        )
        # Each runner is looked up only when its turn comes, so earlier stages
        # have already finished by the time a later one is resolved.
        for attribute in stage_attributes:
            getattr(self, attribute).run()

**Pipeline chuan bi du lieu --> Tien xu ly du lieu --> Trich xuat dac trung Statistics --> Trich xuat anh Mel Spectrogram cho tieng Anh**

In [3]:
# English-dataset run (currently disabled): uncomment the three lines below to
# run the same pipeline with the English `Config` instead.
# config = Config()
# pipeline = AudioFeaturePipeline(config)
# pipeline.run()

**Pipeline chuan bi du lieu --> Tien xu ly du lieu --> Trich xuat dac trung Statistics --> Trich xuat anh Mel Spectrogram cho tieng Viet**

In [4]:
# Build the Vietnamese-dataset configuration and hand it to the pipeline.
config = VietnameseDatasetConfig()
pipeline = AudioFeaturePipeline(config)
# Executes every pipeline stage back to back; the output recorded below spans
# roughly 19 minutes of wall-clock time (04:32 to 04:51).
pipeline.run()

[32m2024-06-23 04:32:20.227[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.train_test_validation_split[0m:[36mprocess_folders[0m:[36m22[0m - [1mProcessing: Splitting files into train, test, and validation sets.[0m


Splitting data into train, test, and validation sets...


[32m2024-06-23 04:32:20.573[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36mprocess_folders[0m:[36m79[0m - [1mProcessing: D:/data_analysis/speech_emotion_recognition/data/VietnameseDataset/train_test_splited_data/raw/train[0m
[32m2024-06-23 04:32:20.573[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Angry[0m


Augmenting audio and extracting file paths...


[32m2024-06-23 04:32:22.567[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Disgusted[0m
[32m2024-06-23 04:32:23.379[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Fearful[0m
[32m2024-06-23 04:32:24.033[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Happy[0m
[32m2024-06-23 04:32:24.809[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Neutral[0m
[32m2024-06-23 04:32:25.522[0m | [1mINFO    [0m | [36mmodules.preparing.scripts.augment_audio_and_extract_file_path[0m:[36m_process_folder[0m:[36m60[0m - [1mProcessing folder: Sad[0m
[32m2024

Data preparation completed.


[32m2024-06-23 04:32:45.218[0m | [1mINFO    [0m | [36mmodules.pre_processing.scripts.pre_processing_data[0m:[36mprocess_and_save_audio_files[0m:[36m57[0m - [1mProcessed 1000 files in train dataset.[0m
[32m2024-06-23 04:32:50.019[0m | [1mINFO    [0m | [36mmodules.pre_processing.scripts.pre_processing_data[0m:[36mprocess_and_save_audio_files[0m:[36m57[0m - [1mProcessed 0 files in test dataset.[0m
[32m2024-06-23 04:32:53.590[0m | [1mINFO    [0m | [36mmodules.pre_processing.scripts.pre_processing_data[0m:[36mprocess_and_save_audio_files[0m:[36m57[0m - [1mProcessed 0 files in validation dataset.[0m


Running feature extraction for train dataset...


[32m2024-06-23 04:32:58.922[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 0 file.[0m
[32m2024-06-23 04:33:38.524[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 100 file.[0m
[32m2024-06-23 04:34:17.679[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 200 file.[0m
[32m2024-06-23 04:34:56.863[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 300 file.[0m
[32m2024-06-23 04:35:35.930[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 400 file.[0m
[32m2024-06-23 04:36:14.787[0m | [1mINF

Feature extraction for train dataset completed.
Running feature extraction for test dataset...


[32m2024-06-23 04:43:25.744[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 0 file.[0m
[32m2024-06-23 04:44:11.120[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 100 file.[0m
[32m2024-06-23 04:44:56.515[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 200 file.[0m


Feature extraction for test dataset completed.
Running feature extraction for validation dataset...


[32m2024-06-23 04:45:32.304[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 0 file.[0m
[32m2024-06-23 04:46:17.419[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 100 file.[0m
[32m2024-06-23 04:47:04.742[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 200 file.[0m
[32m2024-06-23 04:47:55.913[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 300 file.[0m
[32m2024-06-23 04:48:45.748[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_statistic_features[0m:[36mprocess_folder[0m:[36m165[0m - [1mProcessed 400 file.[0m
[32m2024-06-23 04:49:13.471[0m | [1mINF

Feature extraction for validation dataset completed.
Extracting Mel spectrogram for train dataset...


[32m2024-06-23 04:49:13.736[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 4 files![0m
[32m2024-06-23 04:49:13.804[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 5 files![0m
[32m2024-06-23 04:49:13.859[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 6 files![0m
[32m2024-06-23 04:49:13.922[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 7 files![0m
[32m2024-06-23 04:49:14.012[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 8 files![0m
[32m2024-06-23 04:49:14.089[0m | [1mINFO    [0m | [36mmodule

Mel spectrogram extraction for train dataset completed.
Extracting Mel spectrogram for test dataset...


[32m2024-06-23 04:51:09.410[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 3 files![0m
[32m2024-06-23 04:51:09.505[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 4 files![0m
[32m2024-06-23 04:51:09.569[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 5 files![0m
[32m2024-06-23 04:51:09.623[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 6 files![0m
[32m2024-06-23 04:51:09.677[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 7 files![0m
[32m2024-06-23 04:51:09.732[0m | [1mINFO    [0m | [36mmodule

Mel spectrogram extraction for test dataset completed.
Extracting Mel spectrogram for validation dataset...


[32m2024-06-23 04:51:30.674[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 3 files![0m
[32m2024-06-23 04:51:30.769[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 4 files![0m
[32m2024-06-23 04:51:30.882[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 5 files![0m
[32m2024-06-23 04:51:30.970[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 6 files![0m
[32m2024-06-23 04:51:31.058[0m | [1mINFO    [0m | [36mmodules.extracting_feature.scripts.extract_mel_spectrogram[0m:[36mprocess_folder[0m:[36m55[0m - [1mProcessed 7 files![0m
[32m2024-06-23 04:51:31.144[0m | [1mINFO    [0m | [36mmodule

Mel spectrogram extraction for validation dataset completed.
