In [1]:
import geopandas as gpd
import pandas as pd
import seaborn as sns
from matplotlib import pyplot as plt

In [3]:
# Read the Strava edges CSV (2021 export, per the file name) into `df`;
# the path is relative to the notebook's working directory.
df = pd.read_csv(
    filepath_or_buffer='../datasets/strava_edges_2021.csv',
)

### Basic dataset info

1. `edge_uid` is the Strava-specific ID for a street.
2. `osm_reference_id` should be the OpenStreetMap way ID - it could be used to match against other datasets.
3. Most valuable numbers: `forward_trip_count` / `reverse_trip_count`.
4. It's possible to download commute-only data (leisure trips excluded). TODO: quantify the difference.
5. Maybe export the dataset by month/week - that would make it possible to aggregate and match with other datasets.

In [4]:
# Overview of the loaded frame, rendered in order by a single display() call:
# first rows, shape, column labels, and summary statistics.
display(
    df.head(),
    f"Shape: {df.shape}",
    "Columns:",
    df.columns,
    df.describe(),
)

Unnamed: 0,edge_uid,activity_type,year,forward_trip_count,reverse_trip_count,forward_people_count,reverse_people_count,forward_commute_trip_count,reverse_commute_trip_count,forward_leisure_trip_count,...,reverse_20_34_people_count,forward_35_54_people_count,reverse_35_54_people_count,forward_55_64_people_count,reverse_55_64_people_count,forward_65_plus_people_count,reverse_65_plus_people_count,forward_average_speed,reverse_average_speed,osm_reference_id
0,160893973,Ride,2021,5,30,5,15,0,0,5,...,0,5,10,0,0,0,0,5.94,3.15,93103358
1,160900085,Ride,2021,5,0,5,0,0,0,5,...,0,5,0,0,0,0,0,1.36,0.0,65201855
2,160901788,Ride,2021,65,65,60,55,5,5,60,...,20,25,20,5,5,0,0,0.56,0.35,33968694
3,160901895,Ride,2021,255,400,85,100,25,20,230,...,20,55,55,0,5,0,0,2.66,4.61,108343596
4,160902450,Ride,2021,75,185,70,130,5,15,70,...,30,35,60,0,10,0,5,2.03,2.6,74064352


'Shape: (193812, 34)'

'Columns:'

Index(['edge_uid', 'activity_type', 'year', 'forward_trip_count',
       'reverse_trip_count', 'forward_people_count', 'reverse_people_count',
       'forward_commute_trip_count', 'reverse_commute_trip_count',
       'forward_leisure_trip_count', 'reverse_leisure_trip_count',
       'forward_morning_trip_count', 'reverse_morning_trip_count',
       'forward_evening_trip_count', 'reverse_evening_trip_count',
       'forward_male_people_count', 'reverse_male_people_count',
       'forward_female_people_count', 'reverse_female_people_count',
       'forward_unspecified_people_count', 'reverse_unspecified_people_count',
       'forward_13_19_people_count', 'reverse_13_19_people_count',
       'forward_20_34_people_count', 'reverse_20_34_people_count',
       'forward_35_54_people_count', 'reverse_35_54_people_count',
       'forward_55_64_people_count', 'reverse_55_64_people_count',
       'forward_65_plus_people_count', 'reverse_65_plus_people_count',
       'forward_average_speed', 'reverse_average_speed', 'osm_reference_id'],
      dtype='object')

Unnamed: 0,edge_uid,year,forward_trip_count,reverse_trip_count,forward_people_count,reverse_people_count,forward_commute_trip_count,reverse_commute_trip_count,forward_leisure_trip_count,reverse_leisure_trip_count,...,reverse_20_34_people_count,forward_35_54_people_count,reverse_35_54_people_count,forward_55_64_people_count,reverse_55_64_people_count,forward_65_plus_people_count,reverse_65_plus_people_count,forward_average_speed,reverse_average_speed,osm_reference_id
count,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,...,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0,193812.0
mean,161987600.0,2021.0,328.296674,299.673266,122.016774,114.457619,52.651229,44.795859,275.645445,254.877407,...,40.220265,55.902472,52.790952,4.376638,4.11925,1.105607,1.054579,4.053632,3.8167,288277100.0
std,1366626.0,0.0,1000.382059,947.005243,269.185387,261.843734,243.399422,216.46787,804.559041,773.482855,...,106.047168,115.831211,112.967226,9.626298,9.36967,2.968917,2.965756,4.211878,5.409011,277694800.0
min,160865700.0,2021.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4019269.0
25%,161036600.0,2021.0,10.0,10.0,5.0,5.0,0.0,0.0,10.0,10.0,...,0.0,5.0,5.0,0.0,0.0,0.0,0.0,2.0,1.8,52010290.0
50%,161099500.0,2021.0,50.0,40.0,25.0,25.0,5.0,5.0,40.0,35.0,...,5.0,15.0,10.0,0.0,0.0,0.0,0.0,3.74,3.6,177655500.0
75%,161970300.0,2021.0,255.0,220.0,120.0,105.0,20.0,20.0,215.0,190.0,...,35.0,55.0,50.0,5.0,5.0,0.0,0.0,5.4,5.27,430820500.0
max,165160500.0,2021.0,27120.0,27210.0,4775.0,4790.0,7965.0,8030.0,21610.0,21775.0,...,2175.0,1810.0,1810.0,125.0,130.0,45.0,50.0,363.99,1468.95,1023971000.0
