In [1]:
import pandas as pd

# ---- CHANGE THESE TWO ONLY ----
TARGET_DISTRICT = "Bengaluru Urban"
TARGET_DATE = "2025-03-01"

# ---- OPTIONAL: explicit format of the CSV "date" column ----
# None keeps pandas' automatic format inference. With inference, a day-first
# string such as "01-03-2025" is read month-first by default, and
# errors="coerce" silently turns every value that does not fit into NaT, so
# the date filter below can match nothing without any error being raised.
# NOTE(review): the CSV contents are not visible from this cell - if the
# files store DD-MM-YYYY, set this to "%d-%m-%Y".
DATE_FORMAT = None

# ---- FILE PATHS (edit if needed) ----
enrolment_path = "api_data_aadhar_enrolment_0_500000.csv"
demographic_path = "api_data_aadhar_demographic_0_500000.csv"
biometric_path = "api_data_aadhar_biometric_0_500000.csv"


def standardize(df, date_format=None):
    """Normalize one loaded table in place and return it.

    Column names are stripped and lower-cased, the "date" column is parsed to
    datetimes (values that cannot be parsed become NaT) and surrounding
    whitespace is removed from the "district" column.

    Args:
        df: DataFrame with "date" and "district" columns (any header casing).
        date_format: Optional strptime format for the "date" column; None
            lets pandas infer the format.

    Returns:
        The same DataFrame object, modified in place.
    """
    df.columns = df.columns.str.strip().str.lower()
    df["date"] = pd.to_datetime(df["date"], format=date_format, errors="coerce")
    df["district"] = df["district"].str.strip()
    return df


def filter_by_district_and_date(df, district, date):
    """Return the rows of *df* for one district on one date.

    The district comparison ignores letter case and surrounding whitespace, so
    an exact match still matches and "bengaluru urban" matches as well.

    Args:
        df: Table already passed through ``standardize``.
        district: District name to select.
        date: Date to select; anything ``pd.to_datetime`` accepts.

    Returns:
        The matching rows (possibly empty).
    """
    wanted_district = str(district).strip().casefold()
    same_district = df["district"].str.strip().str.casefold() == wanted_district
    same_date = df["date"] == pd.to_datetime(date)
    return df[same_district & same_date]


def sum_age_counts(df):
    """Return the grand total of every column whose name contains "age"."""
    return df.filter(like="age").sum().sum()


def explain_no_match(name, df, district, date):
    """Build a one-line diagnostic for a filter that selected no rows.

    The message reports how many rows satisfy each criterion on its own, how
    many dates are missing or failed to parse, and the parsed date range, so a
    misspelt district can be told apart from a date-parsing problem.

    Args:
        name: Label of the dataset, used as the message prefix.
        df: Table already passed through ``standardize``.
        district: District name that was requested.
        date: Date that was requested.

    Returns:
        The diagnostic message.
    """
    wanted_district = str(district).strip().casefold()
    wanted_date = pd.to_datetime(date)
    district_rows = int(
        (df["district"].str.strip().str.casefold() == wanted_district).sum()
    )
    date_rows = int((df["date"] == wanted_date).sum())
    missing_dates = int(df["date"].isna().sum())
    return (
        f"{name}: no rows for district {district!r} on {wanted_date} "
        f"(rows with that district: {district_rows}; "
        f"rows with that date: {date_rows}; "
        f"missing/unparseable dates: {missing_dates}; "
        f"parsed date range: {df['date'].min()} to {df['date'].max()})"
    )


def warn_if_no_match(name, df, matched, district, date):
    """Emit a warning when *matched* is empty; otherwise do nothing."""
    if matched.empty:
        import warnings

        warnings.warn(explain_no_match(name, df, district, date), stacklevel=2)


# Runs when executed as a notebook cell or script (where __name__ is
# "__main__"); importing the helpers above does not touch the CSV files.
if __name__ == "__main__":
    # ---- LOAD ----
    enrol = pd.read_csv(enrolment_path)
    demo = pd.read_csv(demographic_path)
    bio = pd.read_csv(biometric_path)

    # ---- STANDARDIZE ----
    for df in [enrol, demo, bio]:
        standardize(df, DATE_FORMAT)

    target_date = pd.to_datetime(TARGET_DATE)

    # ---- FILTER ----
    enrol_f = filter_by_district_and_date(enrol, TARGET_DISTRICT, target_date)
    demo_f = filter_by_district_and_date(demo, TARGET_DISTRICT, target_date)
    bio_f = filter_by_district_and_date(bio, TARGET_DISTRICT, target_date)

    # ---- SUM COUNTS ----
    enrol_total = sum_age_counts(enrol_f)
    demo_total = sum_age_counts(demo_f)
    bio_total = sum_age_counts(bio_f)

    # ---- RESULT ----
    result = pd.DataFrame({
        "dataset": ["enrolment", "demographic", "biometric"],
        "total_count": [enrol_total, demo_total, bio_total],
    })

    print(result)

    # A total of 0 is ambiguous on its own: say so when the filter itself
    # selected nothing rather than leaving a silent row of zeros.
    warn_if_no_match("enrolment", enrol, enrol_f, TARGET_DISTRICT, target_date)
    warn_if_no_match("demographic", demo, demo_f, TARGET_DISTRICT, target_date)
    warn_if_no_match("biometric", bio, bio_f, TARGET_DISTRICT, target_date)


       dataset  total_count
0    enrolment            0
1  demographic            0
2    biometric            0
