# In [None]:
# Import necessary libraries
import pandas as pd
import matplotlib.pyplot as plt

# Load the dataset
file_path = 'Import Export Trade data EU.csv'  # Adjust the path as needed
df = pd.read_csv(file_path)

# Data Cleaning
# Standardize column names FIRST (lowercase, spaces -> underscores).
# Every later lookup in this script uses the normalized names, so the 'date'
# access below must happen after this step; otherwise a raw header such as
# 'Date' would raise a KeyError before it ever gets normalized.
df.columns = df.columns.str.lower().str.replace(' ', '_')

# Convert the 'date' column to datetime format
df['date'] = pd.to_datetime(df['date'])

# Exploratory Data Analysis (EDA)
# Top 5 Importers by Total Trade Value
# Sum 'total_cif_value' per 'importer_name', then keep the five largest sums.
value_by_importer = df.groupby('importer_name')['total_cif_value'].sum()
top_importers = value_by_importer.nlargest(5)
print("Top 5 Importers by Total Trade Value (USD):", top_importers, sep="\n")

# Plotting top importers: bar chart drawn on an explicit Axes handle
fig, ax = plt.subplots(figsize=(10, 6))
top_importers.plot(kind='bar', ax=ax)
ax.set_title('Top 5 Importers by Total Trade Value')
ax.set_xlabel('Importer Name')
ax.set_ylabel('Total Trade Value (USD)')
# Tilt the tick labels and right-align them so long names stay readable
plt.setp(ax.get_xticklabels(), rotation=45, ha='right')
plt.show()

# Top Exporting Countries by Total Trade Value
# Sum 'total_cif_value' per 'export_country', then keep the five largest sums.
value_by_export_country = df.groupby('export_country')['total_cif_value'].sum()
top_exporting_countries = value_by_export_country.nlargest(5)
print(
    "Top 5 Exporting Countries by Total Trade Value (USD):",
    top_exporting_countries,
    sep="\n",
)

# Plotting top exporting countries: bar chart drawn on an explicit Axes handle
fig, ax = plt.subplots(figsize=(10, 6))
top_exporting_countries.plot(kind='bar', color='skyblue', ax=ax)
ax.set_title('Top 5 Exporting Countries by Total Trade Value')
ax.set_xlabel('Export Country')
ax.set_ylabel('Total Trade Value (USD)')
# Tilt the tick labels and right-align them so they do not overlap
plt.setp(ax.get_xticklabels(), rotation=45, ha='right')
plt.show()

# Top Products by HS Code
# Sum 'total_cif_value' per 'hs_code', then keep the five largest sums.
value_by_hs_code = df.groupby('hs_code')['total_cif_value'].sum()
top_products = value_by_hs_code.nlargest(5)
print("Top 5 Products by HS Code:", top_products, sep="\n")

# Plotting top products by HS Code: bar chart drawn on an explicit Axes handle
fig, ax = plt.subplots(figsize=(10, 6))
top_products.plot(kind='bar', color='green', ax=ax)
ax.set_title('Top 5 Products by HS Code')
ax.set_xlabel('HS Code')
ax.set_ylabel('Total Trade Value (USD)')
# Tilt the tick labels and right-align them under their bars
plt.setp(ax.get_xticklabels(), rotation=45, ha='right')
plt.show()

# Monthly Trade Trends (focusing on August 2020 as per your report)
# The heading and plot title below both say "August 2020", so the selection
# must match on month AND year. Filtering on month alone would report August
# rows from every year in the file under the "August 2020" label.
report_month = 'August'
report_year = 2020

in_report_month = df['month'] == report_month
# to_numeric makes the comparison work whether 'year' was parsed as an
# integer, a float, or text; values that are not numbers become NaN and
# simply do not match.
in_report_year = pd.to_numeric(df['year'], errors='coerce') == report_year

monthly_trade = (
    df[in_report_month & in_report_year]
    .groupby(['month', 'year'])['total_cif_value']
    .sum()
)
print("Total Trade Value in August 2020:")
print(monthly_trade)

# Plotting monthly trade trends
if monthly_trade.empty:
    # Nothing matched the period: avoid handing an empty Series to .plot()
    print("No rows found for August 2020; skipping the plot.")
else:
    plt.figure(figsize=(10, 6))
    monthly_trade.plot(kind='line', marker='o', color='red')
    plt.title('Total Trade Value in August 2020')
    plt.xlabel('Month-Year')
    plt.ylabel('Total Trade Value (USD)')
    plt.grid(True)
    plt.show()

# Conclusion
"""
This notebook provides a detailed analysis of the import-export trade data.
Key insights include:
- Identification of top importers, exporting countries, and products based on HS codes.
- Analysis of monthly trade trends, highlighting a spike in August 2020.
You can further explore the dataset by adjusting the visualizations or focusing on other time periods or products.
"""
