In [None]:
from pathlib import Path

import matplotlib.pyplot as plt
import pandas as pd

# Integer gender codes stored in the metadata CSVs -> human-readable labels.
# Any code missing from this mapping becomes NaN after Series.map.
gender_map = {1: "Female", 0: "Male"}

# Load each cohort, decode its "Gender" column, and tag every row with the
# cohort it came from so the two frames can be told apart after stacking.
takotsubo_df = pd.read_csv("takotsubo_cases_metadata.csv").assign(
    Gender=lambda frame: frame["Gender"].map(gender_map),
    Class="Takotsubo",
)
normal_df = pd.read_csv("normal_cases_metadata.csv").assign(
    Gender=lambda frame: frame["Gender"].map(gender_map),
    Class="Normal",
)

# Single frame holding both cohorts, re-indexed 0..n-1, used for the summaries.
df = pd.concat([takotsubo_df, normal_df], ignore_index=True)

# Count rows per (Class, Gender) pair, then pivot Gender into columns so each
# class is one row; pairs that never occur are filled with 0.
class_gender_sizes = df.groupby(["Class", "Gender"]).size()
gender_counts = class_gender_sizes.unstack(fill_value=0)

# Report the counts, one line per class. `.get(..., 0)` covers the case where
# a gender label is absent from the data and therefore has no column.
print("Gender Breakdown by Class:")
for cls in gender_counts.index:
    row = gender_counts.loc[cls]
    print(f"  {cls}: {row.get('Female', 0)} Female, {row.get('Male', 0)} Male")

# Save one age histogram per class under figures/.
# The output directory is created up front: savefig does not create missing
# parent directories and would otherwise fail with FileNotFoundError.
figures_dir = Path("figures")
figures_dir.mkdir(parents=True, exist_ok=True)

for cls, filename in [("Takotsubo", "takotsubo_age_histogram.png"),
                      ("Normal", "normal_age_histogram.png")]:
    subset = df[df["Class"] == cls]

    # Use explicit Figure/Axes objects instead of pyplot's implicit
    # "current figure" so each iteration only touches its own figure.
    fig, ax = plt.subplots(figsize=(6, 4))
    ax.hist(subset["Age"], bins=10, color='skyblue', edgecolor='black', alpha=0.8)
    ax.set_title(f"{cls} Age Distribution")
    ax.set_xlabel("Age")
    ax.set_ylabel("Number of Patients")
    fig.tight_layout()
    fig.savefig(figures_dir / filename)

    # Close the figure so repeated runs do not accumulate open figures.
    plt.close(fig)


Gender Breakdown by Class:
  Normal: 53 Female, 23 Male
  Takotsubo: 84 Female, 8 Male
