# Heart Disease Prediction using Machine Learning
This notebook loads a heart disease dataset, inspects and visualizes it, trains a random forest classifier, and evaluates the model's performance on a held-out test set.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report, ConfusionMatrixDisplay

In [None]:
# Read the heart-disease CSV from the plotly/datasets GitHub repository
# into a DataFrame, then preview its first rows.
DATA_URL = 'https://raw.githubusercontent.com/plotly/datasets/master/heart.csv'
df = pd.read_csv(DATA_URL)
df.head()

In [None]:
# Basic information
# Print a concise summary of the DataFrame (columns, non-null counts, dtypes)
# to spot unexpected types or missing data before modelling.
df.info()

In [None]:
# Count the null entries in each column; the Series is shown as the cell output.
missing_per_column = df.isnull().sum()
missing_per_column

In [None]:
# Bar chart of how many rows fall into each value of the 'target' column.
ax = sns.countplot(data=df, x='target')
ax.set_title('Heart Disease Distribution')
plt.show()

In [None]:
# Separate the label column from the predictor columns, then hold out
# 20% of the rows as a test set (seeded so the split is repeatable).
y = df['target']
X = df.drop(columns='target')
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

In [None]:
# Train model
# Seed the forest so its bootstrap sampling and feature selection repeat
# on every Restart & Run All; without it the reported metrics change from
# run to run. 42 matches the seed used for the train/test split.
model = RandomForestClassifier(random_state=42)
model.fit(X_train, y_train)
# Predict labels for the held-out test rows; used by the evaluation cells.
y_pred = model.predict(X_test)

In [None]:
# Evaluate model on the held-out test set
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
# Concatenate instead of passing the report as a second print() argument:
# print's default separator would insert a space right after the newline,
# shifting the report's header line one column out of alignment with its rows.
print("\nClassification Report:\n" + classification_report(y_test, y_pred))

In [None]:
# Tabulate true vs. predicted labels for the test set and draw the matrix.
cm = confusion_matrix(y_test, y_pred)
# plot() returns the display object itself, so `disp` still refers to it.
disp = ConfusionMatrixDisplay(confusion_matrix=cm).plot()
plt.show()