In [None]:
import pandas as pd

# Location of the climate CSV file.
# NOTE: this is a placeholder value -- point it at the real dataset before running.
url = 'path_to_your_dataset.csv'

# Read the CSV into a DataFrame bound to `climate_data`.
climate_data = pd.read_csv(url)

# Sanity check: print the leading rows (five, which is the pandas default).
print(climate_data.head(n=5))

In [None]:
# Report how many missing values each column contains before any rows are removed
print(climate_data.isnull().sum())

# Drop every row that has at least one missing value. The name is rebound to
# the result rather than mutating the loaded frame object in place.
climate_data = climate_data.dropna()

# Parse the 'date' column into datetime values
# (assumes the dataset has a 'date' column -- confirm against the CSV).
climate_data = climate_data.assign(date=pd.to_datetime(climate_data['date']))

# Summarise the cleaned frame. DataFrame.info() writes its report to stdout
# itself and returns None, so it must not be wrapped in print(): doing so
# emits a stray "None" line after the summary.
climate_data.info()

In [None]:
import matplotlib.pyplot as plt

# Split out the rows belonging to each of the two countries being compared
tunisia_data = climate_data.loc[climate_data['country'] == 'Tunisia']
cameroon_data = climate_data.loc[climate_data['country'] == 'Cameroon']

# One figure, one line per country: 'avg_temp' on the y-axis against 'date' on the x-axis
plt.figure(figsize=(12, 6))
for series_label, series_frame, series_color in (
    ('Tunisia', tunisia_data, 'blue'),
    ('Cameroon', cameroon_data, 'orange'),
):
    plt.plot(
        series_frame['date'],
        series_frame['avg_temp'],
        label=series_label,
        color=series_color,
    )

# Annotate the figure so it can be read on its own
plt.title('Average Temperature Fluctuations in Tunisia and Cameroon (1980-2023)')
plt.xlabel('Year')
plt.ylabel('Average Temperature (°C)')
plt.legend()
plt.grid()
plt.show()

In [None]:
# Keep only observations dated from 1980-01-01 through 2005-12-31 (both bounds inclusive)
on_or_after_start = climate_data['date'] >= '1980-01-01'
on_or_before_end = climate_data['date'] <= '2005-12-31'
filtered_data = climate_data[on_or_after_start & on_or_before_end]

# One figure, one line per country, drawn from the date-restricted frame
plt.figure(figsize=(12, 6))
for country_name, line_color in (('Tunisia', 'blue'), ('Cameroon', 'orange')):
    # Select this country's rows once and reuse them for both axes
    country_rows = filtered_data[filtered_data['country'] == country_name]
    plt.plot(
        country_rows['date'],
        country_rows['avg_temp'],
        label=country_name,
        color=line_color,
    )

# Annotate the figure; tick labels are rotated 45 degrees
plt.title('Average Temperature Fluctuations in Tunisia and Cameroon (1980-2005)')
plt.xlabel('Year')
plt.ylabel('Average Temperature (°C)')
plt.xticks(rotation=45)
plt.legend()
plt.grid()
plt.show()

In [None]:
# Filter data for Senegal
senegal_data = climate_data[climate_data['country'] == 'Senegal']

# Split into two consecutive, non-overlapping periods:
#   - first period:  1980-01-01 through 2000-12-31 (inclusive)
#   - second period: strictly after 2000-12-31, through 2023-12-31 (inclusive)
senegal_1980_2000 = senegal_data[(senegal_data['date'] >= '1980-01-01') & (senegal_data['date'] <= '2000-12-31')]
senegal_2000_2023 = senegal_data[(senegal_data['date'] > '2000-12-31') & (senegal_data['date'] <= '2023-12-31')]

# Give both histograms the same value range so their 20 bins share identical
# edges. Without an explicit range each plt.hist call derives its bins from its
# own data's min/max, so bin widths differ between the two periods and the
# overlaid bar heights are not directly comparable.
period_temps = pd.concat([senegal_1980_2000['avg_temp'], senegal_2000_2023['avg_temp']])
if period_temps.empty:
    # Nothing to measure: fall back to matplotlib's default range handling
    shared_range = None
else:
    shared_range = (period_temps.min(), period_temps.max())

# Plotting histograms (semi-transparent so the overlap between periods stays visible)
plt.figure(figsize=(12, 6))
plt.hist(senegal_1980_2000['avg_temp'], bins=20, range=shared_range, alpha=0.5, label='1980-2000', color='blue')
plt.hist(senegal_2000_2023['avg_temp'], bins=20, range=shared_range, alpha=0.5, label='2000-2023', color='orange')
plt.title('Temperature Distribution in Senegal')
plt.xlabel('Average Temperature (°C)')
plt.ylabel('Frequency')
plt.legend()
plt.grid()
plt.show()