In [1]:
import _pickle as cPickle

import pandas as pd

import numpy as np

def mean_normalize(featureMatrix):
    """Standardizes each feature (column) to zero mean and unit sample variance.

    Args:
      featureMatrix: 2-D array-like (NumPy array or pandas DataFrame). Each row is a feature
        vector corresponding to one audio recording; each column holds the values of one
        feature across all recordings.

    Returns:
      A new object with the same shape as the input in which every column has had its mean
      subtracted and been divided by its sample standard deviation (ddof=1). The input is
      NOT modified. Columns whose sample standard deviation is exactly zero (constant
      features) come back as all zeros instead of NaN. With fewer than two rows the sample
      standard deviation is undefined, so the result is NaN.
    """
    mean = np.mean(featureMatrix, axis=0)  # per-column (per-feature) mean
    std = np.std(featureMatrix, axis=0, ddof=1)  # per-column sample standard deviation

    # A constant feature has std == 0; dividing by it would turn the whole column into NaN
    # (0 / 0). Use a divisor of 1 there so the centred column simply stays at zero.
    std = np.where(std == 0, 1.0, std)

    # Build the result out of place: the caller's data stays intact, and integer inputs are
    # promoted to float instead of failing on an in-place float assignment.
    return (featureMatrix - mean) / std

In [2]:
    # NOTE: unpickling executes arbitrary code -- only load .pkl files from a trusted source.

    # Feature matrix for every fold except fold 10: load first, then standardize column-wise.
    training_examples = pd.read_pickle('Extracted_Features-notFold10_features.pkl')
    training_examples = mean_normalize(training_examples)
    print(training_examples)

    # Labels that go with the feature rows loaded above.
    training_labels = pd.read_pickle('Extracted_Features-notFold10_labels.pkl')
    print(training_labels)

           1         2         3         4         5         6         7    \
0    -0.875542 -0.622549 -1.090828 -0.090771 -2.263999 -1.900575 -1.218669   
1    -0.530166 -0.603892 -3.786665  1.381130 -2.682635 -0.178429 -3.085594   
2     0.280982 -0.549262 -0.706601  1.300636  1.189285  0.096146  0.675431   
3     0.592061  1.829181  0.962011  0.172504  0.646491 -0.228645 -0.200837   
4     0.764453 -0.770179  0.638805  1.127109  0.424002  1.155224 -0.342862   
5     0.823503  0.637886 -0.010350  0.051369  1.129698  0.191977  0.799904   
6     0.400374 -0.049567  0.844638  0.326067  0.455439  1.104650 -0.329534   
7     0.626530 -0.311542  1.004811  0.764647  0.304599  0.501288 -0.468860   
8    -0.030379  2.252392 -1.962940 -1.539425 -1.629150 -1.485747 -1.887235   
9     0.564187 -2.619802  1.681387  0.548475  1.832969  0.761291  1.133038   
10   -0.847911 -0.638604 -1.497012 -1.597428  1.063349  0.964635  0.104981   
11    0.279747  0.411525 -0.107634  0.133261  1.433032  0.270771