In [6]:
import pandas as pd

# Combine the per-property distance tables (CBD/trains/schools, parks and
# shopping) into one CSV in the landing folder.

# --- Locations -------------------------------------------------------------
# Input CSVs
distances_cbd_trains_schools_path = '/home/Daniel Bi/project two/data/landing/rental_distances_cbd_trains_schools.csv'
parks_path = '/home/Daniel Bi/project two/data/landing/rental_with_parks.csv'
shopping_path = '/home/Daniel Bi/project two/data/landing/rental_with_shopping.csv'
# Destination for the combined table
output_path = '/home/Daniel Bi/project two/data/landing/rental_merged.csv'

# --- Columns each supplementary table contributes --------------------------
# Only these columns (plus the join key) are carried over from each table.
columns_to_append_parks = [
    'nearest_parks_name',
    'nearest_parks_latitude',
    'nearest_parks_longitude',
    'straight_line_distance_parks',
    'route_distance_parks',
]
columns_to_append_shopping = [
    'nearest_shopping_name',
    'nearest_shopping_latitude',
    'nearest_shopping_longitude',
    'straight_line_distance_shopping',
    'route_distance_shopping',
]

# --- Load ------------------------------------------------------------------
df_cbd_trains_schools = pd.read_csv(distances_cbd_trains_schools_path)
df_parks = pd.read_csv(parks_path)
df_shopping = pd.read_csv(shopping_path)

# --- Build the join key ----------------------------------------------------
# The parks and shopping tables are keyed by their row position as loaded
# (the index read_csv assigns), with no +1/-1 offset applied.
# NOTE(review): this assumes 'property_index' in the main table uses the same
# 0-based row numbering as these two files -- confirm against the upstream step.
for supplementary in (df_parks, df_shopping):
    supplementary['property_index'] = supplementary.index

# --- Merge -----------------------------------------------------------------
# Left joins keep every row of the main table; a property with no matching
# key simply gets missing values in the appended columns.
df_merged = (
    df_cbd_trains_schools
    .merge(df_parks[['property_index', *columns_to_append_parks]],
           on='property_index', how='left')
    .merge(df_shopping[['property_index', *columns_to_append_shopping]],
           on='property_index', how='left')
)

# --- Save ------------------------------------------------------------------
# index=False: the DataFrame's own row index is not written as a column.
df_merged.to_csv(output_path, index=False)

print(f"Merged dataset saved at {output_path}")




Merged dataset saved at /home/Daniel Bi/project two/data/landing/rental_merged.csv
