In [None]:
# Siri Mel Spectrograms

# Importing required libraries
import librosa
import matplotlib.pyplot as plt
import numpy as np
import os

# Loading siri audio files
# librosa.display is a submodule; librosa releases before 0.10 do not load it on
# a bare `import librosa`, so import it explicitly before calling specshow.
import librosa.display

SIRI_AUDIO_DIR = "padded_siri_audio"

# Calculations for Mel Spectrograms (loop-invariant, so defined once up front)
n_fft = 2048 # FFT window length in samples (sets the frequency resolution)
hop_length = 512 # samples between successive frames (sets the temporal resolution)
n_mels = 128 # number of Mel frequency bands used to represent the spectrum

for file in os.listdir(SIRI_AUDIO_DIR):
    # Skip macOS / Jupyter housekeeping entries
    if ".DS_Store" in file or ".ipynb_checkpoints" in file:
        continue

    audio_file = os.path.join(SIRI_AUDIO_DIR, file)
    # Skip sub-directories: only regular files can be decoded as audio
    if not os.path.isfile(audio_file):
        continue

    # y is the waveform (amplitude samples), sr is the sampling rate
    y, sr = librosa.load(audio_file)

    # Creating Mel Spectrogram (power spectrogram on the Mel scale)
    S = librosa.feature.melspectrogram(y=y, sr=sr, n_fft=n_fft, hop_length=hop_length, n_mels=n_mels)

    # Convert power spectrogram to dB scale (logarithmic scale), relative to the clip's peak
    S_db = librosa.power_to_db(S, ref=np.max)

    # Plotting the Mel Spectrogram
    fig = plt.figure(figsize=(10, 4))
    im = librosa.display.specshow(S_db, sr=sr, hop_length=hop_length)
    # plt.title(f"Mel Spectrogram {file}")
    plt.tight_layout()

    # Draw colorbar (left disabled; presumably so the saved image holds only
    # the spectrogram itself -- confirm before re-enabling)
    # cbar_ax = plt.gcf().add_axes([0.2, 0, 0.6, 0.05])
    # cbar = plt.colorbar(im, format="%+2.0f dB", cax=cbar_ax, orientation="horizontal")
    # cbar.ax.set_xlabel("dB")

    # Saving Mel Spectrogram to the current working directory.
    # splitext strips the real extension whatever its length, whereas slicing
    # off 4 characters is only right for 3-letter extensions such as ".wav".
    stem = os.path.splitext(file)[0]
    plt.savefig(f"{stem}_img.png", bbox_inches='tight', pad_inches=0)
    plt.show()

    # Release the figure so a long directory listing does not pile up open figures
    plt.close(fig)

In [None]:
# not_siri Mel Spectrograms

# Importing required libraries
import librosa
import matplotlib.pyplot as plt
import numpy as np
import os

# Loading not_siri audio files
# librosa.display is a submodule; librosa releases before 0.10 do not load it on
# a bare `import librosa`, so import it explicitly before calling specshow.
import librosa.display

NOT_SIRI_AUDIO_DIR = "padded_not_siri_audio"

# Calculations for Mel Spectrograms (loop-invariant, so defined once up front)
n_fft = 2048 # FFT window length in samples (sets the frequency resolution)
hop_length = 512 # samples between successive frames (sets the temporal resolution)
n_mels = 128 # number of Mel frequency bands used to represent the spectrum

for file in os.listdir(NOT_SIRI_AUDIO_DIR):
    # Skip macOS / Jupyter housekeeping entries
    if ".DS_Store" in file or ".ipynb_checkpoints" in file:
        continue

    audio_file = os.path.join(NOT_SIRI_AUDIO_DIR, file)
    # Skip sub-directories: only regular files can be decoded as audio
    if not os.path.isfile(audio_file):
        continue

    # y is the waveform (amplitude samples), sr is the sampling rate
    y, sr = librosa.load(audio_file)

    # Creating Mel Spectrogram (power spectrogram on the Mel scale)
    S = librosa.feature.melspectrogram(y=y, sr=sr, n_fft=n_fft, hop_length=hop_length, n_mels=n_mels)

    # Convert power spectrogram to dB scale (logarithmic scale), relative to the clip's peak
    S_db = librosa.power_to_db(S, ref=np.max)

    # Plotting the Mel Spectrogram
    fig = plt.figure(figsize=(10, 4))
    im = librosa.display.specshow(S_db, sr=sr, hop_length=hop_length)
    # plt.title(f"Mel Spectrogram {file}")
    plt.tight_layout()

    # Draw colorbar (left disabled; presumably so the saved image holds only
    # the spectrogram itself -- confirm before re-enabling)
    # cbar_ax = plt.gcf().add_axes([0.2, 0, 0.6, 0.05])
    # cbar = plt.colorbar(im, format="%+2.0f dB", cax=cbar_ax, orientation="horizontal")
    # cbar.ax.set_xlabel("dB")

    # Saving Mel Spectrogram to the current working directory.
    # splitext strips the real extension whatever its length, whereas slicing
    # off 4 characters is only right for 3-letter extensions such as ".wav".
    stem = os.path.splitext(file)[0]
    plt.savefig(f"{stem}_img.png", bbox_inches='tight', pad_inches=0)
    plt.show()

    # Release the figure so a long directory listing does not pile up open figures
    plt.close(fig)