In [None]:
import pandas as pd

# Load the cleaned data

In [None]:
# Read the cleaned CSV and parse its 'time' column into datetimes in one chain.
# format='mixed' lets pandas infer the format per value; errors='coerce' turns
# unparseable entries into NaT instead of raising.
df = pd.read_csv("quakes-cleaned.csv").assign(
    time=lambda frame: pd.to_datetime(frame['time'], format='mixed', errors='coerce')
)

# 1. Top 5 High-Risk Zones
# Group by exact (latitude, longitude) pair and count events to find the most active locations

In [None]:
# Count events per (latitude, longitude) pair, order by that count (largest first),
# and keep the five busiest pairs.
# NOTE(review): grouping is on exact coordinate values, so nearby events with slightly
# different coordinates land in different groups — confirm this matches the intent of "zones".
high_risk_zones = (
    df.groupby(['latitude', 'longitude'])
    .size()
    .reset_index(name='count')
    .sort_values(by='count', ascending=False)
    .head(5)
)
print("Top 5 High-Risk Zones:", high_risk_zones, sep="\n")

# 2. The Most Seismic Activity in a Local Area
# Take the first row of the sorted high-risk zones table: the coordinate pair with the most events

In [None]:
# The high-risk table is sorted by event count (descending), so its first row is the
# coordinate pair with the most recorded events.
most_seismic_area = high_risk_zones.iloc[0]
# Pulling a single row out of a frame returns a Series with one common dtype; with float
# coordinates the integer count is upcast and would print as e.g. "12.0". Cast it back to
# int so the report shows a whole number of events.
print(f"\nMost Seismic Area: Latitude {most_seismic_area['latitude']}, Longitude {most_seismic_area['longitude']} with {int(most_seismic_area['count'])} events.")

# 3. Most Affected Places
# Count the number of earthquakes by 'place'

In [None]:
# Tally events per 'place' value (most frequent first), keep the ten most frequent,
# and expose the result as a two-column table: 'place' and 'count'.
most_affected_places = (
    df['place']
    .value_counts()
    .head(10)
    .rename_axis('place')
    .reset_index(name='count')
)
print("\nMost Affected Places:", most_affected_places, sep="\n")

# 4. Earthquake Frequency by Hour
# Extract the hour from the 'time' column

In [None]:
# Hour of day for every event, taken from the parsed 'time' column.
# NOTE(review): hours are in whatever timezone the parsed timestamps carry — confirm.
df['hour'] = df['time'].dt.hour
# Timestamps that failed to parse are NaT, which makes the hour column float (0.0, 1.0, ...).
# Drop the missing hours and cast to int before counting so the table lists whole hours.
earthquake_frequency_by_hour = (
    df['hour']
    .dropna()
    .astype(int)
    .value_counts()
    .sort_index()  # chronological order: hour 0 first
    .rename_axis('hour')
    .reset_index(name='frequency')
)
print("\nEarthquake Frequency by Hour:")
print(earthquake_frequency_by_hour)

# 5. Average Magnitude of All Earthquakes

In [None]:
# Mean of the 'mag' column across all rows (pandas skips missing values by default),
# reported to two decimal places.
magnitudes = df['mag']
avg_magnitude = magnitudes.mean()
summary_line = f"\nAverage Magnitude of Earthquakes: {avg_magnitude:.2f}"
print(summary_line)