In [1]:
# Dependencies
import pandas as pd

## Merging Rent, Population and Amenities Data for Dashboard Use


This notebook ***merges city rent & population data with amenities data (hospitals, schools, supermarkets)***, calculates population-normalized metrics (per 100k residents), and saves the result as 'dashboard_data.csv' for use in an interactive data visualization dashboard. Note that the "schools" metric (`schools_per_100k`) is currently computed from the `universities_count` column.

In [None]:
# Load the data files
# Paths are relative to the notebook's working directory.
rent_csv_path = "../Output/city_rent_population.csv"
amenities_csv_path = "../Output/city_amenities_data.csv"

rent_df = pd.read_csv(rent_csv_path)            # rent + population, one "City" column used as join key later
amenities_df = pd.read_csv(amenities_csv_path)  # amenity counts; city label column is renamed in the next step

In [3]:
# Prepare and clean
# The amenities CSV stores its city labels in a column pandas reads back as
# "Unnamed: 0" (presumably a saved index -- confirm against the file that
# produced it). Rename it so both frames share the same join key.
# Reassigning (instead of inplace=True) keeps the cell safe to re-run.
amenities_df = amenities_df.rename(columns={"Unnamed: 0": "City"})

# Strip stray whitespace from the join key on BOTH sides. Cleaning only one
# frame would let a padded name such as "Berlin " in the other frame fail to
# match and be silently dropped by the inner merge that follows.
rent_df["City"] = rent_df["City"].str.strip()
amenities_df["City"] = amenities_df["City"].str.strip()

In [6]:
# Merge on 'City'
# Inner join: only cities present in both frames are kept; a city missing
# from either input does not appear in merged_df.
merged_df = rent_df.merge(right=amenities_df, how="inner", on="City")

In [8]:
# Calculate amenities per 100k population
PER_CAPITA_SCALE = 100000  # rates are expressed per 100,000 residents

# Output rate column -> source count column in merged_df.
# NOTE(review): "schools_per_100k" is derived from universities_count, so the
# column name and the data disagree. The name is kept because downstream
# consumers may depend on it -- confirm which one is intended.
AMENITY_RATE_SOURCES = {
    "hospitals_per_100k": "hospitals_count",
    "schools_per_100k": "universities_count",
    "groceries_per_100k": "supermarkets_count",
}

# Mask non-positive populations so the division yields NaN rather than
# inf, which would otherwise be written into the dashboard CSV.
population = merged_df["Population(2021)"].where(merged_df["Population(2021)"] > 0)

# One formula applied to every amenity; assign() returns a new frame, so
# re-running this cell just recomputes the same three columns.
merged_df = merged_df.assign(**{
    rate_col: (merged_df[count_col] / population) * PER_CAPITA_SCALE
    for rate_col, count_col in AMENITY_RATE_SOURCES.items()
})

In [None]:
# Save final dataset for dashboard use
dashboard_csv_path = "../Output/dashboard_data.csv"

# index=False leaves the DataFrame's row index out of the written file.
merged_df.to_csv(dashboard_csv_path, index=False)

print("✅ 'dashboard_data.csv' created successfully.")

✅ 'dashboard_data.csv' created successfully.
