# Anemia in Heart Failure Patients: Data Analysis & Visualization

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline

In [None]:
# Read the anemia / heart-failure CSV into `df` and preview its first rows
df = pd.read_csv(filepath_or_buffer='anemia_hf_data.csv')
df.head(n=5)

In [None]:
# Convert Yes/No to 1/0 for analysis.
#
# Series.map with a dict turns every value that is not a key into NaN, so
# running this cell a second time would map the already-encoded 1/0 values
# to NaN and silently wipe both columns. The dtype guard makes the cell
# safe to re-run: a column that is already numeric is left untouched.
yes_no_codes = {'Yes': 1, 'No': 0}
for col in ('IV_Iron_Administered', 'Readmitted_in_30_Days'):
    if not pd.api.types.is_numeric_dtype(df[col]):
        # Values other than exactly 'Yes' / 'No' become NaN here.
        df[col] = df[col].map(yes_no_codes)

In [None]:
# Summary statistics table for the DataFrame (pandas' default describe() output)
summary_stats = df.describe()
summary_stats

In [None]:
# Boxplot: distribution of hemoglobin for each 30-day readmission outcome
hgb_ax = sns.boxplot(data=df, x='Readmitted_in_30_Days', y='Hemoglobin_g_dL')
hgb_ax.set_title('Hemoglobin Levels vs 30-Day Readmission')
hgb_ax.set_xlabel('Readmitted (1=Yes, 0=No)')
hgb_ax.set_ylabel('Hemoglobin (g/dL)')
plt.tight_layout()
plt.show()

In [None]:
# Barplot: IV Iron Therapy vs Readmission
#
# barplot's default estimator is the mean, and the y column is coded 1/0,
# so each bar height is the share of readmitted patients in that group.
# `errorbar=None` switches the error bars off; it replaces the `ci=None`
# spelling, which is deprecated since seaborn 0.12 (requires seaborn >= 0.12).
sns.barplot(
    x='IV_Iron_Administered',
    y='Readmitted_in_30_Days',
    data=df,
    errorbar=None,
)
plt.title('Impact of IV Iron Therapy on 30-Day Readmission')
plt.xlabel('IV Iron Administered (1=Yes, 0=No)')
plt.ylabel('Readmission Rate')
plt.tight_layout()
plt.show()

In [None]:
# Correlation Heatmap
#
# Pairwise correlations (DataFrame.corr defaults) between the lab values,
# ejection fraction and the 1/0 readmission flag.
correlation = df[['Hemoglobin_g_dL', 'Ferritin_ng_mL', 'TSAT_pct', 'EF_pct', 'Readmitted_in_30_Days']].corr()
# Pin the colour scale to the full correlation range [-1, 1]. Without this,
# seaborn scales the diverging 'coolwarm' map to the data's min/max, so the
# neutral colour does not sit at 0 and weak positive correlations can show
# up as "negative" blue.
sns.heatmap(correlation, annot=True, cmap='coolwarm', vmin=-1, vmax=1)
plt.title('Correlation Matrix')
plt.tight_layout()
plt.show()