In [None]:
# Calculate the total population growth in Europe between 2000 and 2010.
# Identify the top 5 European countries by population growth during this period.
# Create a line plot showing the population changes of these countries from 2000 to 2010.

import pandas as pd
import matplotlib.pyplot as plt

# Read the population table from population.csv.
data = pd.read_csv('population.csv')

# Build the continent mask once, then combine it with each year of interest
# to get the European snapshot for 2000 and for 2010.
is_european = data['continent'].eq('Europe')
data_europe_2000 = data.loc[is_european & data['year'].eq(2000)]
data_europe_2010 = data.loc[is_european & data['year'].eq(2010)]

# Put each country's 2000 and 2010 populations side by side on one row.
# merge() defaults to an inner join, so only countries present in both
# snapshots are kept; the suffixes tell the two population columns apart.
snapshot_cols = ['country name', 'population']
europe_growth = data_europe_2000[snapshot_cols].merge(
    data_europe_2010[snapshot_cols],
    on='country name',
    suffixes=('_2000', '_2010'),
)

# Per-country growth is the 2010 population minus the 2000 population.
europe_growth['growth'] = europe_growth['population_2010'].sub(
    europe_growth['population_2000']
)

# Add up the per-country changes to get the Europe-wide figure and report it.
total_growth_europe = europe_growth['growth'].sum()
print(f"Total population growth in Europe between 2000 and 2010: {total_growth_europe} million")

# Keep the five rows with the largest absolute growth, largest first.
top_5_growth = europe_growth.nlargest(n=5, columns='growth')

# Print a heading (preceded by a blank line) followed by the
# country/growth table for those five rows.
print(
    "\nTop 5 European countries by population growth between 2000 and 2010:",
    top_5_growth.loc[:, ['country name', 'growth']],
    sep="\n",
)

# Create a line plot showing the population changes of these countries from 2000 to 2010
top_5_countries = top_5_growth['country name'].tolist()

# Select every available year in the 2000-2010 window (between() is inclusive
# on both ends) rather than only the two endpoint years, so each line traces
# the population across the decade instead of being a single straight
# segment. If the dataset only holds 2000 and 2010 rows, this selects the
# same rows as taking the two snapshots separately.
in_window = (
    (data['continent'] == 'Europe')
    & data['year'].between(2000, 2010)
    & data['country name'].isin(top_5_countries)
)

# Sort chronologically so each country's points are connected in year order.
top_5_data_combined = (
    data.loc[in_window, ['country name', 'year', 'population']]
    .sort_values(['country name', 'year'])
)

# Plotting the line plot: one line per country, drawn in growth-rank order so
# the legend lists the fastest-growing country first.
plt.figure(figsize=(12, 6))
for country in top_5_countries:
    country_data = top_5_data_combined[top_5_data_combined['country name'] == country]
    plt.plot(country_data['year'], country_data['population'], marker='o', label=country)

plt.xlabel('Year', fontsize=12)
plt.ylabel('Population (in millions)', fontsize=12)
plt.title('Population Changes in the Top 5 European Countries (2000-2010)', fontsize=14)
plt.legend()
plt.grid(True)
plt.tight_layout()
plt.show()

NameError: name 'europe_data_2000' is not defined