In [12]:
import pandas as pd
import matplotlib.pyplot as plt
import os

print("Current working directory:", os.getcwd())

# Output folders. The visuals folder name lives in one place so the save
# paths and the final status message cannot drift apart.
VISUALS_DIR = "visuals"
REPORT_DIR = "report"

# Ensure folders exist (created relative to the working directory printed above)
os.makedirs(VISUALS_DIR, exist_ok=True)
os.makedirs(REPORT_DIR, exist_ok=True)

# Load data
df = pd.read_csv("sales_data.csv")
print("Columns in dataset:", df.columns)

# Clean data: drop every row that has a missing value in any column
df.dropna(inplace=True)

# Convert Date column from text to datetime so the .dt accessor works below
df['Date'] = pd.to_datetime(df['Date'])

# -----------------------------
# Visualization 1: Sales by Region
# -----------------------------
# Sum of Total_Sales for each distinct Region value
region_sales = df.groupby("Region")["Total_Sales"].sum()

plt.figure()
region_sales.plot(kind="bar")
plt.title("Total Sales by Region")
plt.xlabel("Region")
plt.ylabel("Total Sales")
plt.tight_layout()
plt.savefig(os.path.join(VISUALS_DIR, "sales_by_region.png"))
plt.close()  # release the figure so it is not kept open after saving

# -----------------------------
# Visualization 2: Monthly Sales Trend
# -----------------------------
# NOTE(review): dt.month is the calendar month number only, so rows from the
# same month of different years are summed together — confirm the data covers
# a single year, otherwise group by year and month instead.
df['Month'] = df['Date'].dt.month
monthly_sales = df.groupby("Month")["Total_Sales"].sum()

plt.figure()
monthly_sales.plot(kind="line", marker='o')
plt.title("Monthly Sales Trend")
plt.xlabel("Month")
plt.ylabel("Total Sales")
plt.tight_layout()
plt.savefig(os.path.join(VISUALS_DIR, "monthly_sales_trend.png"))
plt.close()

# Report the folder the files were actually written to (previously the message
# named a "visualizations/" folder that this script never creates).
print(f"✅ Visuals saved inside {VISUALS_DIR}/ folder")


Current working directory: C:\Users\Simranjeet\Desktop\The Developers Arena
Columns in dataset: Index(['Date', 'Product', 'Quantity', 'Price', 'Customer_ID', 'Region',
       'Total_Sales'],
      dtype='object')
✅ Visuals saved inside visualizations/ folder
