#### Importing Libraries

In [1]:
import pandas as pd
import numpy as np
from sklearn import preprocessing
import matplotlib.pyplot as plt 
plt.rc("font", size=14)
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split
import seaborn as sns
sns.set(style="white")
sns.set(style="whitegrid", color_codes=True)

#### Get from CSV File

In [2]:
data = pd.read_csv(r'Parkinsons Train Data.csv', header=0)
data = data.dropna()
print(data.shape)
print(list(data.columns))

(1040, 28)
['Subject Id', 'Jitter(local)', 'Jitter(local, absolute)', 'Jitter (rap)', 'Jitter (ppq5)', 'Jitter (ddp)', 'Shimmer (local)', 'Shimmer (local, db)', 'Shimmer (apq3)', 'Shimmer (apq5)', 'Shimmer (apq11)', 'Shimmer (dda)', 'AC', 'NDH', 'HTM', 'Median Pitch', 'Mean Pitch', 'Standard deviation', 'Minimum pitch', 'Maximum pitch', 'Number of pulses', 'Number of periods', 'Mean period', 'Standard deviation of period', 'Fraction of locally unvoiced frames', 'Number of voice breaks', 'Degree of voice breaks', 'Class information']


#### Viewing the datasets

In [3]:
data.head()

Unnamed: 0,Subject Id,Jitter(local),"Jitter(local, absolute)",Jitter (rap),Jitter (ppq5),Jitter (ddp),Shimmer (local),"Shimmer (local, db)",Shimmer (apq3),Shimmer (apq5),...,Minimum pitch,Maximum pitch,Number of pulses,Number of periods,Mean period,Standard deviation of period,Fraction of locally unvoiced frames,Number of voice breaks,Degree of voice breaks,Class information
0,1,1.488,9e-05,0.9,0.794,2.699,8.334,0.779,4.517,4.609,...,142.229,187.576,160,159,0.006065,0.000416,0.0,0,0.0,1
1,1,0.728,3.8e-05,0.353,0.376,1.059,5.864,0.642,2.058,3.18,...,159.515,234.505,170,169,0.005181,0.000403,2.247,0,0.0,1
2,1,1.22,7.4e-05,0.732,0.67,2.196,8.719,0.875,4.347,5.166,...,146.445,211.442,1431,1427,0.006071,0.000474,10.656,1,0.178,1
3,1,2.502,0.000123,1.156,1.634,3.469,13.513,1.273,5.263,8.771,...,182.713,220.23,94,92,0.00491,0.00032,0.0,0,0.0,1
4,1,3.509,0.000167,1.715,1.539,5.145,9.112,1.04,3.102,4.927,...,182.821,225.162,117,114,0.004757,0.00038,18.182,1,13.318,1


#### ML Method - Neural Networks

In [4]:
def getNN(X, y):
    X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=66, stratify=data['Class information'])
    from sklearn.neural_network import MLPClassifier

    mlp = MLPClassifier(random_state=42)
    mlp.fit(X_train, y_train)

    print("Accuracy on training set: {:.2f}".format(mlp.score(X_train, y_train)))
    print("Accuracy on test set: {:.2f}".format(mlp.score(X_test, y_test)))
    
    print("\nUsing Standard Scaler")
    
    from sklearn.preprocessing import StandardScaler

    scaler = StandardScaler()
    X_train_scaled = scaler.fit_transform(X_train)
    X_test_scaled = scaler.fit_transform(X_test)

    mlp = MLPClassifier(random_state=0)
    mlp.fit(X_train_scaled, y_train)

    print("Accuracy on training set: {:.3f}".format(
        mlp.score(X_train_scaled, y_train)))
    print("Accuracy on test set: {:.3f}".format(mlp.score(X_test_scaled, y_test)))
    
    print("\nUsing a maximum iterations of 1000")
    
    mlp = MLPClassifier(max_iter=1000, random_state=0)
    mlp.fit(X_train_scaled, y_train)

    print("Accuracy on training set: {:.3f}".format(
        mlp.score(X_train_scaled, y_train)))
    print("Accuracy on test set: {:.3f}".format(mlp.score(X_test_scaled, y_test)))
    
    print("\nUsing alpha = 1")
    
    mlp = MLPClassifier(max_iter=1000, alpha=1, random_state=0)
    mlp.fit(X_train_scaled, y_train)

    print("Accuracy on training set: {:.3f}".format(
        mlp.score(X_train_scaled, y_train)))
    print("Accuracy on test set: {:.3f}".format(mlp.score(X_test_scaled, y_test)))

In [5]:
y = data['Class information']

In [6]:
cols_1 = ['Jitter(local)','Shimmer (local)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_1]

In [7]:
getNN(X, y)

Accuracy on training set: 0.69
Accuracy on test set: 0.64

Using Standard Scaler




Accuracy on training set: 0.791
Accuracy on test set: 0.692

Using a maximum iterations of 1000




Accuracy on training set: 0.919
Accuracy on test set: 0.665

Using alpha = 1
Accuracy on training set: 0.774
Accuracy on test set: 0.685


In [8]:
cols_2 = ['Jitter(local)','Shimmer (local, db)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_2]

In [9]:
getNN(X, y)

Accuracy on training set: 0.62
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.791
Accuracy on test set: 0.692

Using a maximum iterations of 1000




Accuracy on training set: 0.912
Accuracy on test set: 0.650

Using alpha = 1
Accuracy on training set: 0.777
Accuracy on test set: 0.700


In [10]:
cols_3 = ['Jitter(local)','Shimmer (apq3)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_3]

In [11]:
getNN(X, y)

Accuracy on training set: 0.65
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.794
Accuracy on test set: 0.681

Using a maximum iterations of 1000




Accuracy on training set: 0.922
Accuracy on test set: 0.654

Using alpha = 1
Accuracy on training set: 0.771
Accuracy on test set: 0.669


In [12]:
cols_4 = ['Jitter(local)','Shimmer (apq5)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_4]

In [13]:
getNN(X, y)

Accuracy on training set: 0.68
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.795
Accuracy on test set: 0.669

Using a maximum iterations of 1000




Accuracy on training set: 0.918
Accuracy on test set: 0.635

Using alpha = 1
Accuracy on training set: 0.778
Accuracy on test set: 0.688


In [14]:
cols_5 = ['Jitter(local)','Shimmer (apq11)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_5]

In [15]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.804
Accuracy on test set: 0.712

Using a maximum iterations of 1000




Accuracy on training set: 0.923
Accuracy on test set: 0.696

Using alpha = 1
Accuracy on training set: 0.786
Accuracy on test set: 0.692


In [16]:
cols_6 = ['Jitter(local)','Shimmer (dda)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_6]

In [17]:
getNN(X, y)

Accuracy on training set: 0.69
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.794
Accuracy on test set: 0.681

Using a maximum iterations of 1000




Accuracy on training set: 0.923
Accuracy on test set: 0.654

Using alpha = 1
Accuracy on training set: 0.768
Accuracy on test set: 0.669


In [18]:
cols_7 = ['Jitter(local, absolute)','Shimmer (local)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_7]

In [19]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.786
Accuracy on test set: 0.688

Using a maximum iterations of 1000




Accuracy on training set: 0.918
Accuracy on test set: 0.654

Using alpha = 1
Accuracy on training set: 0.782
Accuracy on test set: 0.673


In [20]:
cols_8 = ['Jitter(local, absolute)','Shimmer (local, db)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_8]

In [21]:
getNN(X, y)

Accuracy on training set: 0.64
Accuracy on test set: 0.62

Using Standard Scaler




Accuracy on training set: 0.791
Accuracy on test set: 0.692

Using a maximum iterations of 1000




Accuracy on training set: 0.927
Accuracy on test set: 0.646

Using alpha = 1
Accuracy on training set: 0.786
Accuracy on test set: 0.681


In [22]:
cols_9 = ['Jitter(local, absolute)','Shimmer (apq3)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_9]

In [23]:
getNN(X, y)

Accuracy on training set: 0.64
Accuracy on test set: 0.62

Using Standard Scaler




Accuracy on training set: 0.792
Accuracy on test set: 0.665

Using a maximum iterations of 1000




Accuracy on training set: 0.919
Accuracy on test set: 0.608

Using alpha = 1
Accuracy on training set: 0.782
Accuracy on test set: 0.654


In [24]:
cols_10 = ['Jitter(local, absolute)','Shimmer (apq5)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_10]

In [25]:
getNN(X, y)

Accuracy on training set: 0.64
Accuracy on test set: 0.59

Using Standard Scaler




Accuracy on training set: 0.796
Accuracy on test set: 0.662

Using a maximum iterations of 1000




Accuracy on training set: 0.923
Accuracy on test set: 0.631

Using alpha = 1
Accuracy on training set: 0.790
Accuracy on test set: 0.669


In [26]:
cols_11 = ['Jitter(local, absolute)','Shimmer (apq11)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_11]

In [27]:
getNN(X, y)

Accuracy on training set: 0.66
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.796
Accuracy on test set: 0.688

Using a maximum iterations of 1000




Accuracy on training set: 0.933
Accuracy on test set: 0.685

Using alpha = 1
Accuracy on training set: 0.792
Accuracy on test set: 0.696


In [28]:
cols_12 = ['Jitter(local, absolute)','Shimmer (dda)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_12]

In [29]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.791
Accuracy on test set: 0.665

Using a maximum iterations of 1000




Accuracy on training set: 0.921
Accuracy on test set: 0.619

Using alpha = 1
Accuracy on training set: 0.792
Accuracy on test set: 0.654


In [30]:
cols_13 = ['Jitter (rap)','Shimmer (local)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_13]

In [31]:
getNN(X, y)

Accuracy on training set: 0.69
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.783
Accuracy on test set: 0.715

Using a maximum iterations of 1000




Accuracy on training set: 0.927
Accuracy on test set: 0.665

Using alpha = 1
Accuracy on training set: 0.779
Accuracy on test set: 0.696


In [32]:
cols_14 = ['Jitter (rap)','Shimmer (local, db)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_14]

In [33]:
getNN(X, y)

Accuracy on training set: 0.62
Accuracy on test set: 0.62

Using Standard Scaler




Accuracy on training set: 0.790
Accuracy on test set: 0.742

Using a maximum iterations of 1000




Accuracy on training set: 0.924
Accuracy on test set: 0.677

Using alpha = 1
Accuracy on training set: 0.787
Accuracy on test set: 0.704


In [34]:
cols_15 = ['Jitter (rap)','Shimmer (apq3)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_15]

In [35]:
getNN(X, y)

Accuracy on training set: 0.66
Accuracy on test set: 0.64

Using Standard Scaler




Accuracy on training set: 0.777
Accuracy on test set: 0.700

Using a maximum iterations of 1000




Accuracy on training set: 0.922
Accuracy on test set: 0.631

Using alpha = 1
Accuracy on training set: 0.765
Accuracy on test set: 0.685


In [36]:
cols_16 = ['Jitter (rap)','Shimmer (apq5)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_16]

In [37]:
getNN(X, y)

Accuracy on training set: 0.68
Accuracy on test set: 0.61

Using Standard Scaler




Accuracy on training set: 0.795
Accuracy on test set: 0.715

Using a maximum iterations of 1000




Accuracy on training set: 0.915
Accuracy on test set: 0.638

Using alpha = 1
Accuracy on training set: 0.787
Accuracy on test set: 0.669


In [38]:
cols_17 = ['Jitter (rap)','Shimmer (apq11)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_17]

In [39]:
getNN(X, y)

Accuracy on training set: 0.66
Accuracy on test set: 0.64

Using Standard Scaler




Accuracy on training set: 0.790
Accuracy on test set: 0.731

Using a maximum iterations of 1000




Accuracy on training set: 0.937
Accuracy on test set: 0.700

Using alpha = 1
Accuracy on training set: 0.771
Accuracy on test set: 0.727


In [40]:
cols_18 = ['Jitter (rap)','Shimmer (dda)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_18]

In [41]:
getNN(X, y)

Accuracy on training set: 0.70
Accuracy on test set: 0.66

Using Standard Scaler




Accuracy on training set: 0.776
Accuracy on test set: 0.704

Using a maximum iterations of 1000




Accuracy on training set: 0.922
Accuracy on test set: 0.642

Using alpha = 1
Accuracy on training set: 0.763
Accuracy on test set: 0.685


In [42]:
cols_19 = ['Jitter (ppq5)','Shimmer (local)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_19]

In [43]:
getNN(X, y)

Accuracy on training set: 0.68
Accuracy on test set: 0.63

Using Standard Scaler




Accuracy on training set: 0.778
Accuracy on test set: 0.719

Using a maximum iterations of 1000




Accuracy on training set: 0.921
Accuracy on test set: 0.654

Using alpha = 1
Accuracy on training set: 0.776
Accuracy on test set: 0.688


In [44]:
cols_20 = ['Jitter (ppq5)','Shimmer (local, db)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_20]

In [45]:
getNN(X, y)

Accuracy on training set: 0.60
Accuracy on test set: 0.60

Using Standard Scaler




Accuracy on training set: 0.783
Accuracy on test set: 0.719

Using a maximum iterations of 1000




Accuracy on training set: 0.923
Accuracy on test set: 0.673

Using alpha = 1
Accuracy on training set: 0.777
Accuracy on test set: 0.712


In [46]:
cols_21 = ['Jitter (ppq5)','Shimmer (apq3)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_21]

In [47]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.785
Accuracy on test set: 0.696

Using a maximum iterations of 1000




Accuracy on training set: 0.921
Accuracy on test set: 0.669

Using alpha = 1
Accuracy on training set: 0.765
Accuracy on test set: 0.704


In [48]:
cols_22 = ['Jitter (ppq5)','Shimmer (apq5)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_22]

In [49]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.62

Using Standard Scaler




Accuracy on training set: 0.779
Accuracy on test set: 0.715

Using a maximum iterations of 1000




Accuracy on training set: 0.917
Accuracy on test set: 0.635

Using alpha = 1
Accuracy on training set: 0.779
Accuracy on test set: 0.700


In [50]:
cols_23 = ['Jitter (ppq5)','Shimmer (apq11)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_23]

In [51]:
getNN(X, y)

Accuracy on training set: 0.70
Accuracy on test set: 0.65

Using Standard Scaler




Accuracy on training set: 0.783
Accuracy on test set: 0.715

Using a maximum iterations of 1000




Accuracy on training set: 0.941
Accuracy on test set: 0.704

Using alpha = 1
Accuracy on training set: 0.765
Accuracy on test set: 0.704


In [52]:
cols_24 = ['Jitter (ppq5)','Shimmer (dda)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_24]

In [53]:
getNN(X, y)

Accuracy on training set: 0.70
Accuracy on test set: 0.68

Using Standard Scaler




Accuracy on training set: 0.785
Accuracy on test set: 0.696

Using a maximum iterations of 1000




Accuracy on training set: 0.918
Accuracy on test set: 0.677

Using alpha = 1
Accuracy on training set: 0.765
Accuracy on test set: 0.708


In [54]:
cols_25 = ['Jitter (ddp)','Shimmer (local)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_25]
y = data['Class information']

In [55]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.66

Using Standard Scaler




Accuracy on training set: 0.783
Accuracy on test set: 0.719

Using a maximum iterations of 1000




Accuracy on training set: 0.933
Accuracy on test set: 0.669

Using alpha = 1
Accuracy on training set: 0.786
Accuracy on test set: 0.688


In [56]:
cols_26 = ['Jitter (ddp)','Shimmer (local, db)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_26]

In [57]:
getNN(X, y)

Accuracy on training set: 0.61
Accuracy on test set: 0.60

Using Standard Scaler




Accuracy on training set: 0.788
Accuracy on test set: 0.742

Using a maximum iterations of 1000




Accuracy on training set: 0.923
Accuracy on test set: 0.662

Using alpha = 1
Accuracy on training set: 0.779
Accuracy on test set: 0.696


In [58]:
cols_27 = ['Jitter (ddp)','Shimmer (apq3)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_27]

In [59]:
getNN(X, y)

Accuracy on training set: 0.64
Accuracy on test set: 0.64

Using Standard Scaler




Accuracy on training set: 0.777
Accuracy on test set: 0.700

Using a maximum iterations of 1000




Accuracy on training set: 0.919
Accuracy on test set: 0.642

Using alpha = 1
Accuracy on training set: 0.769
Accuracy on test set: 0.681


In [60]:
cols_28 = ['Jitter (ddp)','Shimmer (apq5)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_28]

In [61]:
getNN(X, y)

Accuracy on training set: 0.67
Accuracy on test set: 0.64

Using Standard Scaler




Accuracy on training set: 0.794
Accuracy on test set: 0.708

Using a maximum iterations of 1000




Accuracy on training set: 0.921
Accuracy on test set: 0.642

Using alpha = 1
Accuracy on training set: 0.791
Accuracy on test set: 0.669


In [62]:
cols_29 = ['Jitter (ddp)','Shimmer (apq11)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_29]

In [63]:
getNN(X, y)

Accuracy on training set: 0.69
Accuracy on test set: 0.62

Using Standard Scaler




Accuracy on training set: 0.788
Accuracy on test set: 0.723

Using a maximum iterations of 1000




Accuracy on training set: 0.935
Accuracy on test set: 0.704

Using alpha = 1
Accuracy on training set: 0.771
Accuracy on test set: 0.723


In [64]:
cols_30 = ['Jitter (ddp)','Shimmer (dda)','AC', 'NDH', 'HTM',
       'Median Pitch', 'Mean Pitch', 'Standard deviation',
       'Minimum pitch', 'Maximum pitch', 'Number of pulses',
       'Number of periods', 'Mean period', 'Standard deviation of period',
       'Fraction of locally unvoiced frames', 'Number of voice breaks',
       'Degree of voice breaks']
X = data[cols_30]
y = data['Class information']

In [65]:
getNN(X, y)

Accuracy on training set: 0.69
Accuracy on test set: 0.67

Using Standard Scaler




Accuracy on training set: 0.777
Accuracy on test set: 0.700

Using a maximum iterations of 1000




Accuracy on training set: 0.924
Accuracy on test set: 0.642

Using alpha = 1
Accuracy on training set: 0.764
Accuracy on test set: 0.685
