# In [None]:
# Step 1: Import required libraries
import pandas as pd
import matplotlib.pyplot as plt

# Step 2: Load the CSV file
# The relative path is resolved against the current working directory, so
# 'sales_data.csv' must be in the folder the script/notebook is run from.
df = pd.read_csv('sales_data.csv')

# Step 3: Display the first few rows
print("First 5 rows of the dataset:")
print(df.head())

# Step 4: Dataset information
# DataFrame.info() writes its report to stdout itself and returns None, so it
# is called directly; wrapping it in print() would emit a stray "None" line.
print("\nDataset Information:")
df.info()

# Step 5: Summary statistics
print("\nSummary Statistics:")
print(df.describe())

# Step 6: Total sales per region
# The 'Region' and 'Sales' names must match the CSV header exactly.
grouped_data = df.groupby('Region')['Sales'].sum()
print("\nTotal Sales by Region:", grouped_data, sep="\n")

# Step 7: Bar chart of the per-region totals
# Draw on an explicit Figure/Axes pair instead of pyplot's implicit
# "current figure" state.
fig, ax = plt.subplots(figsize=(8, 5))
grouped_data.plot.bar(ax=ax, color='skyblue')
ax.set_title('Total Sales by Region')
ax.set_xlabel('Region')
ax.set_ylabel('Sales')
# Tilt the region labels so longer names do not overlap.
plt.setp(ax.get_xticklabels(), rotation=45)
# Horizontal guide lines only, to help read the bar heights.
ax.grid(axis='y', linestyle='--', alpha=0.7)
fig.tight_layout()
plt.show()

# Step 8: Monthly sales trend, drawn only when the data has a 'Date' column
if 'Date' in df.columns:
    # Parse the dates in place, then label each row with its year-month
    # period so rows from the same calendar month group together.
    df['Date'] = pd.to_datetime(df['Date'])
    df['Month'] = df['Date'].dt.to_period('M')

    monthly_sales = df.groupby('Month')['Sales'].sum()

    # Line chart on an explicit Figure/Axes pair.
    trend_fig, trend_ax = plt.subplots(figsize=(10, 4))
    monthly_sales.plot.line(
        ax=trend_ax,
        marker='o',
        color='green',
        title='Monthly Sales Trend',
    )
    trend_ax.set_xlabel('Month')
    trend_ax.set_ylabel('Sales')
    trend_ax.grid(True)
    trend_fig.tight_layout()
    plt.show()
