<a href="https://colab.research.google.com/github/elixirutkarsh/GettingStarted/blob/main/gettingstrted.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
# Import libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score

# Load the dataset
# The path is relative, so the CSV is resolved against the current working
# directory of the notebook/script.
heart_data = pd.read_csv('heart_attack_data.csv')

# Explore the dataset
print(heart_data.head())
# DataFrame.info() writes its report straight to stdout and returns None,
# so it must not be wrapped in print() (that would emit a stray "None" line).
heart_data.info()
print(heart_data.describe())
print(heart_data.shape)

# Handle missing data (if any)
# Drops, in place, every row that contains at least one missing value.
heart_data.dropna(inplace=True)

# Visualize the target variable: number of rows per value of 'target'.
sns.countplot(x='target', data=heart_data)
plt.title('Heart Attack Distribution')
plt.show()

# Visualize feature distributions
# Histogram of 'age' with a kernel density estimate overlaid.
sns.histplot(data=heart_data, x='age', kde=True)
plt.title('Age Distribution')
plt.show()

# Box plot of 'chol' to show its spread and any outliers.
sns.boxplot(data=heart_data, x='chol')
plt.title('Cholesterol Distribution')
plt.show()

# Explore feature relationships
# 'age' against 'chol', with points colored by the 'target' value.
sns.scatterplot(data=heart_data, x='age', y='chol', hue='target')
plt.title('Age vs Cholesterol')
plt.show()

# Pairwise correlation of the columns, annotated with the coefficients.
# Only numeric/bool columns are passed to corr(): since pandas 2.0,
# DataFrame.corr() raises on non-numeric columns instead of silently
# skipping them. For an all-numeric frame this selects every column.
sns.heatmap(
    heart_data.select_dtypes(include=['number', 'bool']).corr(),
    annot=True,
    cmap='coolwarm',
)
plt.title('Correlation Matrix')
plt.show()

# Preprocess the data
# Features are every column except the label column 'target'.
X = heart_data.drop('target', axis=1)
y = heart_data['target']
# Hold out 20% of the rows for evaluation; the fixed seed keeps the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Build a prediction model (using Logistic Regression)
# The features are fed in unscaled, so the solver may need more than the
# default 100 iterations to converge; raise the cap to avoid stopping early
# with a ConvergenceWarning and a not-fully-fitted model.
model = LogisticRegression(max_iter=1000)
model.fit(X_train, y_train)

# Make predictions on the held-out rows
y_pred = model.predict(X_test)

# Evaluate model performance on the held-out rows
accuracy = accuracy_score(y_test, y_pred)
precision = precision_score(y_test, y_pred)
recall = recall_score(y_test, y_pred)
f1 = f1_score(y_test, y_pred)

print('Accuracy:', accuracy)
print('Precision:', precision)
print('Recall:', recall)
print('F1-Score:', f1)

# Fine-tune the model (if necessary)

# Summarize findings

