# EDA ON HEART ATTACK ANALYSIS 

![](https://hips.hearstapps.com/hmg-prod.s3.amazonaws.com/images/701/heart-2-1489779361.jpg?resize=480:*)

![](https://img.webmd.com/dtmcms/live/webmd/consumer_assets/site_images/article_thumbnails/slideshows/heart_attack_101_slideshow/650x350_heart_attack_101_slideshow.jpg)

# A heart attack occurs when the flow of blood to the heart is blocked. The blockage is most often a buildup of fat, cholesterol and other substances, which form a plaque in the arteries that feed the heart (coronary arteries).

# IMPORTING THE NECESSARY LIBRARIES

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import scipy as sp
import seaborn as sns
import re
import os
import time
import plotly.express as px


# READING THE FILE

In [None]:
# Load the heart-attack dataset into a DataFrame. The path points at the
# Kaggle input directory, so the dataset is expected to be available there.
data=pd.read_csv("/kaggle/input/heart-attack-analysis-prediction-dataset/heart.csv")

# INFORMATION ABOUT DATASET

In [None]:
# Preview the first rows to check that the file loaded as expected.
data.head()

In [None]:
# Preview the last rows of the dataset.
data.tail()

In [None]:
# Print a summary of the DataFrame: columns, non-null counts and dtypes.
data.info()

In [None]:
data.shape   # (number of rows, number of columns)

In [None]:
# Show every row that is an exact repeat of an earlier row.
data[data.duplicated()]

In [None]:
# Number of missing values in each column (summed down the rows).
data.isnull().sum(axis=0)

In [None]:
# Total number of rows that duplicate an earlier row.
data.duplicated().sum()

About this dataset

Age : Age of the patient

Sex : Sex of the patient

exang: exercise induced angina (1 = yes; 0 = no)

ca: number of major vessels (0-3)

cp : Chest pain type

- Value 1: typical angina
- Value 2: atypical angina
- Value 3: non-anginal pain
- Value 4: asymptomatic

trtbps : resting blood pressure (in mm Hg)

chol : cholesterol in mg/dl fetched via BMI sensor

In [None]:
# Pairwise correlation between the columns of the dataset.
data.corr()

In [None]:
# Quick look at the first three rows as a reminder of the column names.
data.head(3)

In [None]:
# Number of distinct ages that appear in the dataset.
data["age"].unique().size

In [None]:
# Count how many times each distinct row occurs. The call parentheses are
# required: without them the cell only displays the bound method object
# instead of the counts.
data.value_counts()

# ANALYSIS 

# 1)UNI-VARIATE ANALYSIS:

In [None]:
# Bar chart with one bar per distinct age, showing how many patients have it.
plt.figure(figsize=(18, 10))
plt.style.use("ggplot")
sns.countplot(data=data, x="age")
plt.title("COUNT OF PATIENTS AGE", fontsize=20)
plt.xlabel("AGE", fontsize=20)
plt.ylabel("COUNT", fontsize=20)
plt.show()

SO WE FIND THAT THE MOST COMMON AGE AMONG THE PATIENTS IS 58.

In [None]:
# Quick look at the first two rows as a reminder of the column names.
data.head(2)

In [None]:
# Count the patients per value of "sex" and give both columns explicit names.
# A bare value_counts().reset_index() labels its columns ["index", "sex"]
# before pandas 2.0 but ["sex", "count"] from 2.0 on, so the previously
# hard-coded names="index" / values="sex" only worked on older pandas.
s = data["sex"].value_counts().rename_axis("sex").reset_index(name="count")
px.pie(s, names="sex", values="count")  # pie chart of patient counts by sex


So we find that around 207 of the patients are male and 96 are female.

In [None]:
# Count the patients for each chest-pain type ("cp") and turn the result into
# a two-column DataFrame (value, count) that the next cell plots.
# NOTE(review): the column labels depend on the pandas version --
# ["index", "cp"] before 2.0, ["cp", "count"] from 2.0 on.
c=data["cp"].value_counts().reset_index()
c

In [None]:
# Bar chart of the number of patients for each chest-pain type.
#
# `c` holds the chest-pain value counts as (value, count) columns. Their
# labels depend on the pandas version (["index", "cp"] before 2.0,
# ["cp", "count"] from 2.0 on), so the columns are selected by position
# rather than by name to work on both.
cp_types = c.iloc[:, 0]
cp_counts = c.iloc[:, 1]

plt.figure(figsize=(20,10))
plt.style.use("ggplot")
sns.barplot(x=cp_types, y=cp_counts)
plt.title("TYPE OF CHEST PAIN WITH NUMBER OF PATIENTS",fontsize=20)
plt.xlabel("TYPE",fontsize=20)   # explicit labels replace the column names
plt.ylabel("COUNT",fontsize=20)
plt.show()

So we find that the most common chest pain type among the patients is Value 1, that is, typical angina.

In [None]:
# Quick look at the first three rows as a reminder of the column names.
data.head(3)

In [None]:
# Histogram of resting blood pressure ("trtbps").
#
# sns.displot is a figure-level function: it always opens its own figure, so
# the (20, 10) canvas created below used to stay blank and its size was
# ignored. sns.histplot is the axes-level equivalent of displot's default
# histogram and draws onto the current figure instead.
plt.figure(figsize=(20,10))
plt.style.use("ggplot")
sns.histplot(data["trtbps"])
plt.title("DISTRIBUTION OF BLOOD PRESSURE AROUND PATIENTS",fontsize=18)
plt.xlabel("BLOOD PRESSURE",fontsize=20)
plt.ylabel("COUNT",fontsize=20)
plt.show()

In [None]:
# Histogram of cholesterol level ("chol").
#
# sns.displot is a figure-level function: it always opens its own figure, so
# the (20, 10) canvas created below used to stay blank and its size was
# ignored. sns.histplot is the axes-level equivalent of displot's default
# histogram and draws onto the current figure instead.
plt.figure(figsize=(20,10))
plt.style.use("ggplot")
sns.histplot(data["chol"])
plt.title("DISTRIBUTION OF CHOLESTROL LEVEL AROUND PATIENTS",fontsize=18)
plt.xlabel("CHOLESTROL LEVEL",fontsize=20)
plt.ylabel("COUNT",fontsize=20)
plt.show()

In [None]:
# Histogram of the "thalachh" (heart rate) column.
#
# sns.displot is a figure-level function: it always opens its own figure, so
# the (20, 10) canvas created below used to stay blank and its size was
# ignored. sns.histplot is the axes-level equivalent of displot's default
# histogram and draws onto the current figure instead.
plt.figure(figsize=(20,10))
plt.style.use("ggplot")
sns.histplot(data["thalachh"])
plt.title("DISTRIBUTION OF HEART RATE AROUND PATIENTS",fontsize=18)
plt.xlabel("HEART RATE",fontsize=20)
plt.ylabel("COUNT",fontsize=20)
plt.show()

In [None]:
# Quick look at the first two rows as a reminder of the column names.
data.head(2)

# 2)BIVARIATE-ANALYSIS:

# 1)AGE

In [None]:
# Count how often each (age, output) combination occurs, then list the
# combinations from least to most frequent.
data[["age","output"]].value_counts().sort_values()

In [None]:
# Cross-tabulate age against the target: one row per age and one count column
# per distinct value of "output".
v = pd.crosstab(index=data["age"], columns=data["output"])
v = v.reset_index()
# Relabel the columns. This assumes "output" takes exactly two values, the
# smaller one meaning low risk and the larger one high risk.
v.columns = ["age", "low_risk", "high_risk"]
v

In [None]:
# Line chart of the number of high-risk patients at each age.
px.line(v, x="age", y="high_risk", title="RISK OF HIGH HEART-ATTACK WITH AGE")


In [None]:
# Line chart of the number of low-risk patients at each age.
px.line(v, x="age", y="low_risk", title="RISK OF LOW HEART-ATTACK WITH AGE")

In [None]:
# Quick look at the first three rows as a reminder of the column names.
data.head(3)

In [None]:
# Line plot of resting blood pressure ("trtbps") against age.
plt.figure(figsize=(20, 10))
plt.style.use("ggplot")
sns.lineplot(data=data, x="age", y="trtbps")
plt.title("BLOOD PRESSURE WITH AGE", fontsize=20)
plt.xlabel("AGE", fontsize=20)
plt.ylabel("BLOOD PRESSURE", fontsize=20)
plt.show()

SO WE FIND THAT BLOOD PRESSURE IS VERY LIKELY TO INCREASE AS AGE INCREASES.

In [None]:
# Line plot of cholesterol level ("chol") against age.
plt.figure(figsize=(20, 10))
plt.style.use("ggplot")
sns.lineplot(data=data, x="age", y="chol")
plt.title("CHOLESTROL LEVEL  WITH AGE", fontsize=20)
plt.xlabel("AGE", fontsize=20)
plt.ylabel("CHOLESTROL LEVEL", fontsize=20)
plt.show()

SO WE FIND THAT THE CHOLESTEROL LEVEL IN THE BODY IS VERY LIKELY TO INCREASE AS AGE INCREASES.

In [None]:
# Line plot of the "thalachh" (heart rate) column against age.
plt.figure(figsize=(20, 10))
plt.style.use("ggplot")
sns.lineplot(data=data, x="age", y="thalachh")
plt.title("HEART RATE  WITH AGE", fontsize=20)
plt.xlabel("AGE", fontsize=20)
plt.ylabel("HEART RATE", fontsize=20)
plt.show()

AS WE CAN SEE, THE HEART RATE GETS LOWER AS THE AGE OF THE PATIENTS INCREASES.

In [None]:
# Quick look at the first two rows as a reminder of the column names.
data.head(2)

# Q1) DOES AN INCREASE IN THE CHOLESTEROL LEVEL IN THE BODY HAVE ANY EFFECT ON HEART ATTACKS?

In [None]:
# Resting blood pressure against age, with one line per value of "output".
# NOTE(review): the section heading asks about cholesterol, but this cell
# plots "trtbps" (blood pressure) -- confirm which was intended.
plt.figure(figsize=(10, 6))
plt.style.use("ggplot")
sns.lineplot(data=data, x="age", y="trtbps", hue="output")
plt.title("EFFECT OF HEART ATTACK WITH INCREASE IN AGE AND BLOOD PRESSURE")
plt.show()

In [None]:
# "thalachh" (heart rate) against age, with one line per value of "output".
plt.figure(figsize=(10, 6))
plt.style.use("ggplot")
sns.lineplot(data=data, x="age", y="thalachh", hue="output")
plt.title("EFFECT OF HEART ATTACK WITH INCREASE IN AGE AND MAXIMUM HEART RATE")
plt.show()

In [None]:
# Annotated heatmap of the pairwise correlations between all columns.
plt.figure(figsize=(18, 8))
sns.heatmap(
    data.corr(),
    cmap="PuBuGn",
    annot=True,  # write the correlation value inside each cell
)

In [None]:
# Scatter plot of cholesterol level for each value of "output".
sns.scatterplot(data=data, x="output", y="chol")

In [None]:
# Scatter plot of cholesterol against "output" with a fitted regression line.
sns.regplot(data=data, x="output", y="chol")

In [None]:
# Swarm plot of the individual cholesterol values for each value of "output".
sns.swarmplot(data=data, x="output", y="chol")

In [None]:
# Histogram of patient age, coloured by the value of "output".
plt.figure(figsize=(12, 8))
plt.style.use("ggplot")
sns.histplot(data=data, x="age", hue="output")
plt.title("DOES AGE EFFECT THE HEART-ATTACK")
plt.xlabel("Age")
plt.ylabel("Count")
plt.show()

# SO WE MADE THE FOLLOWING CONCLUSIONS:
# 
# 1. With increasing age, the cholesterol level of the body increases, and if the body has a high cholesterol level there is a high chance of a heart attack.
# 2. With increasing age, there is a lower risk of a heart attack.
# 3. An increase in heart rate comes with a higher chance of a heart attack.
# 4. A heart attack occurs when the flow of blood to the heart is blocked.

# IF YOU HAVE ANY QUESTIONS, PLEASE COMMENT BELOW.
# IF YOU LIKE IT, PLEASE UPVOTE. WAITING FOR YOUR VALUABLE FEEDBACK!