In [8]:
import pandas as pd

from sklearn.tree import DecisionTreeClassifier
from sklearn.svm import SVC
from sklearn.ensemble import RandomForestClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from sklearn.neighbors import KNeighborsClassifier
from sklearn.preprocessing import StandardScaler


DATASET_PATH = "dataset/diabetes.csv"  # Set this to the path where you saved diabetes.csv.
# Alternative remote source (disabled).
# NOTE(review): this is a GitHub "/blob/" page URL, which presumably serves an
# HTML page rather than the CSV itself -- confirm, and use the raw-content URL
# if the data should be loaded over the network.
# DATASET_PATH = "https://github.com/MyungKyuYi/AI-class/blob/main/diabetes.csv"

if __name__ == "__main__":
    # Train several classifiers on the CSV at DATASET_PATH and print the
    # hold-out accuracy of each one as "<name>: <accuracy>".

    # NOTE: the variable is called ``iris_dataset`` but it holds whatever CSV
    # DATASET_PATH points at (diabetes.csv by default). The name is kept so
    # that any other cell relying on it keeps working.
    iris_dataset = pd.read_csv(DATASET_PATH)

    # Every column except the last is a feature; the last column is the label.
    x_data = iris_dataset.iloc[:, :-1]
    y_data = iris_dataset.iloc[:, -1]

    # 70/30 train/test split with a fixed seed so the split is repeatable.
    X_train, X_test, Y_train, Y_test = train_test_split(
        x_data, y_data, test_size=0.3, random_state=42
    )

    # Fit the scaler on the training split only, then reuse its statistics on
    # the test split so no test-set information leaks into training.
    scaler = StandardScaler()
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)

    # The tree-based models are randomized; without a seed their accuracy
    # differs between runs even though the split itself is fixed. Seed them
    # with the same value used for the split so the whole run is reproducible.
    classifier_list = [
        ("DT", DecisionTreeClassifier(random_state=42)),
        ("RF", RandomForestClassifier(random_state=42)),
        ("SVM", SVC()),
        ("LR", LogisticRegression(max_iter=3000)),
        ("KNN", KNeighborsClassifier(n_neighbors=3)),
    ]

    for name, model in classifier_list:
        model.fit(X_train, Y_train)
        model_pred = model.predict(X_test)
        accuracy = accuracy_score(Y_test, model_pred)
        print(f"{name}: {accuracy:.4f}")


DT: 0.7013
RF: 0.7446
SVM: 0.7446
LR: 0.7359
KNN: 0.7100
