In [None]:
import pandas as pd
import geopandas as gpd
from shapely.geometry import Point
import matplotlib.pyplot as plt
import seaborn as sns
from statsmodels.tsa.seasonal import seasonal_decompose
import matplotlib.dates as mdates

In [None]:
# Load the pre-filtered dataset and print a summary of its columns and dtypes.
csv_path = 'filtered_data.csv'
df = pd.read_csv(csv_path)
df.info()

In [None]:
# Drop every row that has a missing value in at least one column.
df = df.dropna(axis=0, how='any')

In [None]:
# Parse the 'standard_date' values into a datetime column named 'date'.
df['date'] = pd.to_datetime(df['standard_date'])

# Derive the calendar year and month from the parsed dates.
df['year'] = df['date'].dt.year
df['month'] = df['date'].dt.month

# Build point geometries from the 'lon'/'lat' columns in a single vectorized
# call (x = longitude, y = latitude) instead of creating one Point per row
# through DataFrame.apply.
df['geometry'] = gpd.points_from_xy(df['lon'], df['lat'])

# Wrap the frame as a GeoDataFrame and declare its CRS as WGS84 (EPSG:4326)
# at construction time rather than mutating it afterwards with inplace=True.
gdf = gpd.GeoDataFrame(df, geometry='geometry', crs='EPSG:4326')

# Read the Mexico City polygon layer. The clipping cell that follows uses
# `city_map`, so this file is required, not optional.
city_map = gpd.read_file('poligonos_alcaldias_cdmx')

In [None]:
# Keep only the points that fall inside the city polygons.
# gpd.clip requires both layers to share a CRS and does not reproject the mask
# itself, so align a local copy of the mask with the points' CRS when they
# differ. `city_map` itself is left untouched for any later use.
clip_mask = city_map
if gdf.crs is not None and city_map.crs is not None and city_map.crs != gdf.crs:
    clip_mask = city_map.to_crs(gdf.crs)

gdf = gpd.clip(gdf, clip_mask)
gdf.info()