In [18]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score, classification_report

# Load the dataset


In [19]:
csv_file_path = '/kaggle/input/parkinson-disease-detection/Parkinsson disease.csv'
parkinson_data = pd.read_csv(csv_file_path)

In [20]:
X = parkinson_data.drop(columns=['name', 'status'])
y = parkinson_data['status']

# Splitting the dataset into training and testing sets


In [21]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Standardizing the feature values


In [22]:
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

# Random Forest classifier


In [23]:
rf_classifier = RandomForestClassifier(n_estimators=100, random_state=42)
rf_classifier.fit(X_train_scaled, y_train)
rf_y_pred = rf_classifier.predict(X_test_scaled)

# Gradient Boosting classifier


In [24]:
gb_classifier = GradientBoostingClassifier(n_estimators=100, random_state=42)
gb_classifier.fit(X_train_scaled, y_train)
gb_y_pred = gb_classifier.predict(X_test_scaled)

# Support Vector Classifier


In [25]:
svc_classifier = SVC(kernel='rbf', random_state=42)
svc_classifier.fit(X_train_scaled, y_train)
svc_y_pred = svc_classifier.predict(X_test_scaled)

# Evaluating the models' performance


In [26]:
print("Random Forest Classifier:")
print(f"Accuracy: {accuracy_score(y_test, rf_y_pred) * 100:.2f}%")
print("\nClassification Report:\n", classification_report(y_test, rf_y_pred))

print("\nGradient Boosting Classifier:")
print(f"Accuracy: {accuracy_score(y_test, gb_y_pred) * 100:.2f}%")
print("\nClassification Report:\n", classification_report(y_test, gb_y_pred))

print("\nSupport Vector Classifier:")
print(f"Accuracy: {accuracy_score(y_test, svc_y_pred) * 100:.2f}%")
print("\nClassification Report:\n", classification_report(y_test, svc_y_pred))

Random Forest Classifier:
Accuracy: 94.87%

Classification Report:
               precision    recall  f1-score   support

           0       1.00      0.71      0.83         7
           1       0.94      1.00      0.97        32

    accuracy                           0.95        39
   macro avg       0.97      0.86      0.90        39
weighted avg       0.95      0.95      0.95        39


Gradient Boosting Classifier:
Accuracy: 92.31%

Classification Report:
               precision    recall  f1-score   support

           0       0.83      0.71      0.77         7
           1       0.94      0.97      0.95        32

    accuracy                           0.92        39
   macro avg       0.89      0.84      0.86        39
weighted avg       0.92      0.92      0.92        39


Support Vector Classifier:
Accuracy: 89.74%

Classification Report:
               precision    recall  f1-score   support

           0       1.00      0.43      0.60         7
           1       0.89   