In [None]:
import pandas as pd
import matplotlib.pyplot as plt
from scipy.stats import linregress

In [None]:
# --- Configuration ---------------------------------------------------------
# Everything a reader might want to tune lives here instead of being repeated
# as literals further down.
DATA_PATH = "epa-sea-level.csv"
OUTPUT_PATH = "sea_level_plot.png"
YEAR_COL = "Year"
LEVEL_COL = "CSIRO Adjusted Sea Level"
FULL_FIT_START_YEAR = 1880     # first year drawn for the all-data trend line
RECENT_FIT_START_YEAR = 2000   # first year fitted and drawn for the recent trend line
PROJECTION_END_YEAR = 2050     # last year (inclusive) both trend lines extend to


def fit_and_project(data, start_year, end_year=PROJECTION_END_YEAR):
    """Fit a least-squares line to ``data`` and evaluate it over a year range.

    Parameters
    ----------
    data : pandas.DataFrame
        Frame containing the ``YEAR_COL`` and ``LEVEL_COL`` columns; every row
        passed in is used for the regression.
    start_year : int
        First year at which the fitted line is evaluated.
    end_year : int, optional
        Last year (inclusive) at which the fitted line is evaluated.

    Returns
    -------
    tuple
        ``(fit, years, levels)`` where ``fit`` is the object returned by
        ``linregress``, ``years`` is a ``pd.Series`` of consecutive integer
        years, and ``levels`` is the fitted line evaluated at those years.
    """
    fit = linregress(data[YEAR_COL], data[LEVEL_COL])
    # range() excludes its stop value, hence the +1 to include end_year.
    years = pd.Series(range(start_year, end_year + 1))
    levels = fit.intercept + fit.slope * years
    return fit, years, levels


# Import data
df = pd.read_csv(DATA_PATH)

# Create scatter plot on an explicit figure/axes pair so that every later call
# (labels, trend lines, legend, save) targets this figure unambiguously.
fig, ax = plt.subplots(figsize=(10, 6))
ax.scatter(df[YEAR_COL], df[LEVEL_COL], s=10)
ax.set_xlabel("Year")
ax.set_ylabel("Sea Level (inches)")
ax.set_title("Rise in Sea Level")

# Line of best fit (using all data), extended through PROJECTION_END_YEAR
fit_all, x_pred, y_pred = fit_and_project(df, FULL_FIT_START_YEAR)
# Keep the individual regression statistics available under their usual names.
slope, intercept, r_value, p_value, std_err = fit_all
ax.plot(
    x_pred,
    y_pred,
    'r',
    label=f"Best fit: {FULL_FIT_START_YEAR}–{PROJECTION_END_YEAR}",
)

# Line of best fit (using data from RECENT_FIT_START_YEAR onward)
df_recent = df[df[YEAR_COL] >= RECENT_FIT_START_YEAR]
fit_recent, x_recent, y_recent = fit_and_project(df_recent, RECENT_FIT_START_YEAR)
slope_recent, intercept_recent, r_value_recent, p_value_recent, std_err_recent = fit_recent
ax.plot(
    x_recent,
    y_recent,
    'g',
    label=f"Best fit: {RECENT_FIT_START_YEAR}–{PROJECTION_END_YEAR}",
)

# Add legend
ax.legend()

# Save before showing: the image is written to disk first, then rendered inline.
fig.savefig(OUTPUT_PATH)
plt.show()
