# Imports

In [1]:
import pandas as pd

!pip install praat-parselmouth
import parselmouth

from feature_extraction_utils import *



# Read in Sample Sound File (.wav)

In [2]:
# Empty table that will hold the extracted features.
df = pd.DataFrame()

# Path of the recording to analyse, and the Parselmouth Sound built from it.
sound_filepath = 'sample.wav'
sound = parselmouth.Sound(sound_filepath)

# Extract Features

In [3]:
# Named descriptors. Element [0] of each helper's return value is used as a
# mapping of {column name: value}; the merge order below fixes the column order.
attributes = {}

intensity_attributes = get_intensity_attributes(sound)[0]
pitch_attributes = get_pitch_attributes(sound)[0]
attributes.update(intensity_attributes)
attributes.update(pitch_attributes)

hnr_attributes = get_harmonics_to_noise_ratio_attributes(sound)[0]
gne_attributes = get_glottal_to_noise_ratio_attributes(sound)[0]
attributes.update(hnr_attributes)
attributes.update(gne_attributes)

# Single-value measures stored directly under their own column names.
local_jitter = get_local_jitter(sound)
local_shimmer = get_local_shimmer(sound)

spectrum_attributes = get_spectrum_attributes(sound)[0]
attributes.update(spectrum_attributes)

formant_attributes = get_formant_attributes(sound)[0]
attributes.update(formant_attributes)

# Cepstral features; each delta is derived from the previous result.
lfcc_matrix, mfcc_matrix = get_lfcc(sound), get_mfcc(sound)
delta_mfcc_matrix = get_delta(mfcc_matrix)
delta_delta_mfcc_matrix = get_delta(delta_mfcc_matrix)

# Assemble one ordered record and build the frame in a single step instead of
# enlarging `df` cell by cell with `.at`. The file path is placed first
# explicitly, so re-running this cell always yields the same column order
# (the previous "move last column to the front" step rotated a feature column
# to the front on every re-run once `sound_filepath` already existed).
feature_row = {
    'sound_filepath': sound_filepath,
    'local_jitter': local_jitter,
    'local_shimmer': local_shimmer,
    'lfcc': lfcc_matrix,
    'mfcc': mfcc_matrix,
    'delta_mfcc': delta_mfcc_matrix,
    'delta_delta_mfcc': delta_delta_mfcc_matrix,
    **attributes,
}

# Wrapping the record in a list makes it exactly one row; matrix-valued
# entries are kept whole as single cell values.
rearranged_columns = list(feature_row)
df = pd.DataFrame([feature_row], columns=rearranged_columns)

# Visualize Features

In [4]:
# Bare last expression: the notebook renders the feature table as this cell's output.
df

Unnamed: 0,sound_filepath,local_jitter,local_shimmer,lfcc,mfcc,delta_mfcc,delta_delta_mfcc,min_intensity,relative_min_intensity_time,max_intensity,...,f1_median,f2_median,f3_median,f4_median,formant_dispersion,average_formant,mff,fitch_vtl,delta_f,vtl_delta_f
0,sample.wav,0.0268438,0.0978643,"[[-0.05431217830930484, 0.05285244343900683, -...","[[70.51424251467743, 33.14143488496505, 45.545...","[[5.945542519810594, -4.017987084089242, 7.127...","[[-0.5935564105623996, 0.822749125054675, -4.8...",37.617361,0.977288,77.765843,...,377.805905,1169.953315,2174.813447,3112.286328,911.493474,1708.714749,1315.17852,21.348392,870.184223,20.110684
