## Prepare the necessary data for the app

In [1]:
import os
import json
import pandas as pd

%cd ..

import src.configuration as config

/workspaces/Madesh10-aviation_final_project


In [2]:
# load dataset
data_path = os.path.join(os.getcwd(), "data", "processed", "combined_data.csv")
data_df = pd.read_csv(data_path)

In [3]:
# standardize the origin data to prevent duplicates
data_df['origin'] = data_df['origin'].str.strip().str.upper()
unique_origin = data_df['origin'].unique()
unique_origin

array(['CVG', 'LGA', 'GRR', ..., 'PN03', 'MS46', 'PACM'], dtype=object)

In [4]:
# standardize the destination data to prevent duplicates
data_df['destination'] = data_df['destination'].str.strip().str.upper()
unique_destination = data_df['destination'].unique()
unique_destination

array(['LGA', 'CVG', 'MSP', ..., 'MLY', 'OCH', 'PVB'], dtype=object)

In [5]:
# combine origin and destination to make a route
route_frequency = data_df['origin'] + '_' + data_df['destination']
route_frequency = route_frequency.value_counts().to_dict()
route_frequency

{'OGG_HNL': 974,
 'HNL_OGG': 972,
 'LAX_SFO': 948,
 'SFO_LAX': 947,
 'ORD_LGA': 922,
 'LGA_ORD': 917,
 'LAX_LAS': 879,
 'LAS_LAX': 875,
 'PHX_DEN': 806,
 'DEN_PHX': 801,
 'LAX_JFK': 775,
 'JFK_LAX': 774,
 'BOS_DCA': 771,
 'DCA_BOS': 769,
 'HNL_LIH': 709,
 'LIH_HNL': 705,
 'ATL_MCO': 685,
 'MCO_ATL': 670,
 'HNL_KOA': 669,
 'KOA_HNL': 668,
 'SLC_DEN': 649,
 'DEN_SLC': 648,
 'DEN_LAX': 637,
 'LAX_DEN': 632,
 'EWR_MCO': 632,
 'MCO_EWR': 629,
 'LAX_SEA': 625,
 'SEA_LAX': 624,
 'LAX_PHX': 619,
 'PHX_LAX': 615,
 'LAS_DEN': 612,
 'DEN_LAS': 611,
 'LAS_SAN': 601,
 'PHX_SEA': 599,
 'SAN_LAS': 599,
 'SEA_PHX': 598,
 'PDX_SEA': 589,
 'SEA_PDX': 587,
 'ATL_DCA': 586,
 'DCA_ATL': 586,
 'IAH_DFW': 585,
 'DFW_IAH': 583,
 'FLL_ATL': 579,
 'ATL_FLL': 579,
 'ATL_LGA': 575,
 'LGA_ATL': 574,
 'MIA_LGA': 573,
 'LGA_MIA': 572,
 'LAX_DFW': 567,
 'DFW_LAX': 567,
 'SEA_GEG': 557,
 'PHX_LAS': 556,
 'GEG_SEA': 556,
 'LGA_BOS': 554,
 'SAN_SFO': 553,
 'SFO_SAN': 553,
 'BOS_LGA': 553,
 'DFW_LGA': 553,
 'LAS_PHX': 55

In [6]:
# Define the full file path with the name 'unique_origin.json'
origin_path = os.path.join(config.STATIC_APP_ASSETS, 'unique_origin.json')
destination__path = os.path.join(config.STATIC_APP_ASSETS, 'unique_destination.json')
route_frequency_path = os.path.join(config.STATIC_APP_ASSETS, 'route_frequency.json')

# Save as JSON
with open(origin_path, 'w') as f:
    json.dump(unique_origin.tolist(), f)

with open(destination__path, 'w') as f:
    json.dump(unique_destination.tolist(), f)

with open(route_frequency_path, 'w') as f:
    json.dump(route_frequency, f)