# 다양한 모델 결과 시각화

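이 노트북은 분류, 회귀, 클러스터링 등 다양한 모델의 평가 결과를 시각화하는 코드를 포함합니다. 각 셀은 `model`, `X`, `y`, `X_test`, `y_test`, `cluster_labels`, `X_reduced`, `labels` 등의 변수가 미리 정의되어 있다고 가정하므로, 실행 전에 해당 변수를 준비해야 합니다.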

## 분류 모델 시각화

In [None]:
from sklearn.metrics import confusion_matrix, ConfusionMatrixDisplay, roc_curve, auc, precision_recall_curve
import matplotlib.pyplot as plt


### Confusion Matrix 시각화

In [None]:

# Predict labels for X_test and tabulate them against y_test.
y_pred = model.predict(X_test)
conf_matrix = confusion_matrix(y_test, y_pred)

# Draw the matrix, labelling both axes with the classes stored on the model.
disp = ConfusionMatrixDisplay(
    confusion_matrix=conf_matrix,
    display_labels=model.classes_,
)
disp.plot(cmap='viridis')
# disp.ax_ is the Axes that disp.plot() drew on.
disp.ax_.set_title("Confusion Matrix")
plt.show()


### ROC Curve 시각화

In [None]:
# Column 1 of predict_proba is taken as the positive-class probability
# (assumes a binary classifier -- TODO confirm for the model in use).
y_prob = model.predict_proba(X_test)[:, 1]
fpr, tpr, _ = roc_curve(y_test, y_prob)
roc_auc = auc(fpr, tpr)

fig, ax = plt.subplots(figsize=(8, 6))
ax.plot(fpr, tpr, label=f'ROC Curve (AUC = {roc_auc:.2f})')
# Dashed diagonal from (0, 0) to (1, 1) as a visual reference.
ax.plot([0, 1], [0, 1], linestyle='--', color='gray')
ax.set(
    title="ROC Curve",
    xlabel="False Positive Rate",
    ylabel="True Positive Rate",
)
ax.legend(loc="lower right")
plt.show()



### Precision-Recall Curve 시각화

In [None]:

# Precision/recall pairs computed from y_test and the scores in y_prob
# (y_prob must already be defined by an earlier cell).
precision, recall, _ = precision_recall_curve(y_test, y_prob)

fig, ax = plt.subplots(figsize=(8, 6))
ax.plot(recall, precision, label="Precision-Recall Curve")
ax.set(
    title="Precision-Recall Curve",
    xlabel="Recall",
    ylabel="Precision",
)
ax.legend(loc="lower left")
plt.show()


---

## 회귀 모델 시각화

### 산점도 (실제값 vs 예측값)

In [None]:
# Scatter of actual (x) against predicted (y) values.
fig, ax = plt.subplots(figsize=(8, 6))
ax.scatter(y_test, y_pred, alpha=0.5)

# Dashed black identity line spanning the range of y_test.
diag_lo, diag_hi = y_test.min(), y_test.max()
ax.plot([diag_lo, diag_hi], [diag_lo, diag_hi], 'k--', lw=2)

ax.set(
    title="Actual vs Predicted",
    xlabel="Actual Values",
    ylabel="Predicted Values",
)
plt.show()



### 잔차 플롯 (Residual Plot)

In [None]:


# Residual = actual minus predicted.
residuals = y_test - y_pred

fig, ax = plt.subplots(figsize=(8, 6))
ax.scatter(y_pred, residuals, alpha=0.5)
# Dashed red line at zero residual for reference.
ax.axhline(y=0, color='r', linestyle='--')
ax.set(
    title="Residual Plot",
    xlabel="Predicted Values",
    ylabel="Residuals",
)
plt.show()



### Feature Importance 시각화 (회귀 모델)

In [None]:

# Plot per-feature importances as a horizontal bar chart.
# Models without a `feature_importances_` attribute are skipped silently.
if hasattr(model, 'feature_importances_'):
    feature_importance = model.feature_importances_

    # Use X's column labels when it has them. Otherwise (e.g. X is a plain
    # array, as the positional indexing elsewhere in this notebook implies)
    # fall back to 1-based positional names instead of raising AttributeError.
    if hasattr(X, 'columns'):
        feature_names = X.columns
    else:
        feature_names = [
            f"Feature {i}" for i in range(1, len(feature_importance) + 1)
        ]

    plt.figure(figsize=(10, 6))
    plt.barh(feature_names, feature_importance, color='skyblue')
    plt.title("Feature Importance")
    plt.xlabel("Importance Score")
    plt.show()

---

## 클러스터링 모델 시각화

In [None]:

from sklearn.decomposition import PCA

# Reduce X to two principal components for a 2-D view.
pca = PCA(n_components=2)
X_pca = pca.fit_transform(X)

fig, ax = plt.subplots(figsize=(8, 6))
# Points are colored by cluster_labels, which must be defined beforehand.
points = ax.scatter(
    X_pca[:, 0],
    X_pca[:, 1],
    c=cluster_labels,
    cmap='viridis',
    alpha=0.5,
)
ax.set(
    title="Clustering Visualization with PCA",
    xlabel="Principal Component 1",
    ylabel="Principal Component 2",
)
fig.colorbar(points, ax=ax, label='Cluster')
plt.show()


## 차원 축소 결과 시각화

In [None]:

# Scatter of the first two columns of X_reduced, colored by labels.
# Both X_reduced and labels must be defined beforehand.
fig, ax = plt.subplots(figsize=(8, 6))
points = ax.scatter(
    X_reduced[:, 0],
    X_reduced[:, 1],
    c=labels,
    cmap='viridis',
    alpha=0.5,
)
ax.set(
    title="Dimensionality Reduction Visualization",
    xlabel="Reduced Dimension 1",
    ylabel="Reduced Dimension 2",
)
fig.colorbar(points, ax=ax, label='Class/Cluster')
plt.show()


## 일반 산점도

In [None]:

# General scatter plot of the first two columns of X, colored by y.
# X[:, 0] does not work on a pandas DataFrame, which the feature-importance
# cell's use of X.columns implies X may be. Select columns positionally via
# .iloc when X provides it, and fall back to array indexing otherwise.
if hasattr(X, 'iloc'):
    first_feature, second_feature = X.iloc[:, 0], X.iloc[:, 1]
else:
    first_feature, second_feature = X[:, 0], X[:, 1]

plt.figure(figsize=(8, 6))
plt.scatter(first_feature, second_feature, c=y, cmap='viridis', alpha=0.5)
plt.title("General Scatter Plot")
plt.xlabel("Feature 1")
plt.ylabel("Feature 2")
plt.colorbar(label='Target/Cluster')
plt.show()
