# Data Demonstration

This notebook generates the summary statistics about my data points that I used in my presentation.

In [None]:
import pandas as pd
from pandas import DataFrame

In [None]:
# Maps each time-window label to the suffix used in its CSV file name.
# Insertion order matters: later cells iterate over the loaded dicts and
# report the windows in exactly this order.
TIME_WINDOW_SUFFIXES = {
    "weekendPeak": "peakWn",
    "weekendOffPeak": "oPeakWn",
    "weekdayPeak": "peakWd",
    "weekdayOffPeak": "oPeakWd",
}


def load_city_data(city_code: str, data_dir: str = "./data") -> dict:
    """Read the four classified CSV files of one city.

    Args:
        city_code: Lower-case city code embedded in the file names
            (e.g. ``"atl"`` or ``"clt"``).
        data_dir: Directory that holds the ``classified_data_*.csv`` files.

    Returns:
        A dict keyed by time-window label (see ``TIME_WINDOW_SUFFIXES``) whose
        values are the DataFrames returned by ``pd.read_csv``.
    """
    return {
        label: pd.read_csv(f"{data_dir}/classified_data_{city_code}_{suffix}.csv")
        for label, suffix in TIME_WINDOW_SUFFIXES.items()
    }


atl_data = load_city_data("atl")
clt_data = load_city_data("clt")

In [None]:
# Possible Behaviors:
# 1. no behavior (standing still)
# 2. standard landing
# 3. going around
# 4. switching sides
# 5. flyby
# 6. Unknown

def print_behavior_count(data: DataFrame, key: str):
    """Print how many rows of ``data`` fall under each behavior code.

    Args:
        data: Frame with a ``behavior`` column; rows are tallied for the
            codes 1 through 6.
        key: Label inserted into the heading line of the report.

    The report is written to stdout: a heading, one tab-indented line per
    behavior code, and a trailing blank line. Nothing is returned.
    """
    # (line prefix, behavior code) pairs, in the order they are reported.
    report_lines = (
        ("\tNo Behavior: ", 1),
        ("\tStandard Landing: ", 2),
        ("\tGoing Around: ", 3),
        ("\tSwitching Sides: ", 4),
        ("\tFlyby: ", 5),
        ("\tUnknown: ", 6),
    )

    print(f"Behavior Count {key}:")
    for prefix, code in report_lines:
        matching_rows = data[data["behavior"] == code]
        print(prefix, len(matching_rows))
    print()

In [None]:
## Print totals for each city, followed by a per-time-window breakdown.
def report_city_behavior(heading, city_data):
    """Print the behavior report of one city and return its combined frame.

    Args:
        heading: Title line printed above the separator.
        city_data: Dict mapping a time-window label to that window's DataFrame.

    Returns:
        All of the city's frames concatenated with a fresh index.
    """
    print(heading)
    print("=====================================")

    # Totals across every time window come first ...
    combined = pd.concat(city_data.values(), ignore_index=True)
    print_behavior_count(combined, "ALL TIMES")

    # ... then one report per individual time window.
    for window, frame in city_data.items():
        print_behavior_count(frame, window)
    return combined


atl_combined = report_city_behavior("ATL Behavior Counts", atl_data)
clt_combined = report_city_behavior("CLT Behavior Counts", clt_data)

ATL Behavior Counts
Behavior Count ALL TIMES:
	No Behavior:  304617
	Standard Landing:  129551
	Going Around:  0
	Switching Sides:  5478
	Flyby:  6703
	Unknown:  31200

Behavior Count weekendPeak:
	No Behavior:  138539
	Standard Landing:  43688
	Going Around:  0
	Switching Sides:  494
	Flyby:  3787
	Unknown:  17659

Behavior Count weekendOffPeak:
	No Behavior:  2745
	Standard Landing:  0
	Going Around:  0
	Switching Sides:  0
	Flyby:  0
	Unknown:  258

Behavior Count weekdayPeak:
	No Behavior:  42807
	Standard Landing:  13215
	Going Around:  0
	Switching Sides:  494
	Flyby:  1177
	Unknown:  9611

Behavior Count weekdayOffPeak:
	No Behavior:  120526
	Standard Landing:  72648
	Going Around:  0
	Switching Sides:  4490
	Flyby:  1739
	Unknown:  3672

CLT Behavior Counts
Behavior Count ALL TIMES:
	No Behavior:  224516
	Standard Landing:  22119
	Going Around:  0
	Switching Sides:  2000
	Flyby:  1614
	Unknown:  20049

Behavior Count weekendPeak:
	No Behavior:  55429
	Standard Landing:  3800
	G

In [None]:
import pandas as pd

# One record per (city, time window); each record carries the row count of
# every behavior code from 1 through 6.
rows = []

for city, city_data in (("ATL", atl_data), ("CLT", clt_data)):
    for key, data in city_data.items():
        per_behavior = {
            f"behavior_{behavior}": len(data[data["behavior"] == behavior])
            for behavior in range(1, 7)
        }
        # "city" and "time" lead so they become the first two CSV columns.
        rows.append({"city": city, "time": key, **per_behavior})

# Assemble the records into a single table and persist it without the index.
newData = pd.DataFrame(rows)
newData.to_csv("./data/behavior_counts.csv", index=False)