In [9]:
# Sales Dashboard in JupyterLab
# ===========================================================================
# This notebook analyzes and visualizes sales data in JupyterLab.
# Environment dependencies: pandas, numpy, openpyxl, matplotlib, and plotly;
# the cells below directly use pandas (data loading and aggregation) and plotly (charts).
# It reads data from an Excel file, summarizes it, and generates interactive visualizations.
# By Aman Anil
# =========================================================================== 

In [10]:
# Step 1: Import libraries
import os

import matplotlib.pyplot as plt
import pandas as pd
import plotly.express as px

In [11]:
# Step 2: Load data from Excel
# The workbook location is a machine-specific absolute path, so the notebook
# cannot be re-run elsewhere as-is. Set the SALES_DASHBOARD_XLSX environment
# variable to point at the workbook on another machine; when it is unset (or
# empty) the original location is used, so existing setups behave as before.
file_path = (
    os.environ.get('SALES_DASHBOARD_XLSX')
    or r'D:\personal\bdas.spyberpolymath.com\project\data\Sales_Dashboard.xlsx'
)
# Load the workbook into the DataFrame that every later cell reads from.
df = pd.read_excel(file_path)

In [12]:
# Step 3: Explore data
# Sanity check right after loading: print a caption, then render the leading
# rows of the frame with the notebook's rich table display.
print("First 5 rows of data:")
display(df.head(n=5))

First 5 rows of data:


Unnamed: 0,Date,Region,Product,Sales
0,1970-01-01 05:30:45.658,East,C,674
1,1970-01-01 05:30:45.659,West,B,963
2,1970-01-01 05:30:45.660,North,B,842
3,1970-01-01 05:30:45.661,East,D,340
4,1970-01-01 05:30:45.662,East,B,663


In [13]:
# Step 4: Basic sales summary
# Grand total over every row of the Sales column.
total_sales = df['Sales'].sum()
print(f"Total Sales: {total_sales}")

# Per-region totals as a flat frame with 'Region' and 'Sales' columns;
# as_index=False keeps the group key as a column instead of the index.
sales_by_region = df.groupby('Region', as_index=False)['Sales'].sum()
display(sales_by_region)

Total Sales: 58452


Unnamed: 0,Region,Sales
0,East,13291
1,North,13406
2,South,15237
3,West,16518


In [14]:
# Step 5: Plot sales by region using Plotly
# One bar per region; bar height and bar color both encode the summed Sales.
fig = px.bar(
    data_frame=sales_by_region,
    x='Region',
    y='Sales',
    color='Sales',
    title='Sales by Region',
)
fig.show()

In [15]:
# Step 6: Top products
# Sum Sales per product, then show each product's share of the total as a pie slice.
sales_by_product = df.groupby('Product', as_index=False)['Sales'].sum()
fig2 = px.pie(
    data_frame=sales_by_product,
    names='Product',
    values='Sales',
    title='Sales by Product',
)
fig2.show()

In [16]:
# Step 7: Sales trend if date column exists
# The trend is only built when the frame actually has a 'Date' column, so the
# notebook still runs end-to-end on workbooks without one.
if 'Date' in df.columns:
    if pd.api.types.is_numeric_dtype(df['Date']):
        # A numeric Date column is treated as Excel serial day numbers (days
        # counted from 1899-12-30). A bare pd.to_datetime() reads numbers as
        # nanoseconds since 1970-01-01, which squeezes every row into the
        # first instant of 1970.
        # NOTE(review): the Step 3 preview shows 1970 timestamps one tick
        # apart, which looks like serials such as 45658 (2025-01-01) being
        # misread — confirm against the workbook.
        df['Date'] = pd.to_datetime(df['Date'], unit='D', origin='1899-12-30')
    else:
        # Strings and existing datetimes go through the normal parser; this
        # also keeps the cell safe to re-run after the column was converted.
        df['Date'] = pd.to_datetime(df['Date'])

    # Total Sales per distinct timestamp, flattened to 'Date' and 'Sales' columns.
    sales_trend = df.groupby('Date')['Sales'].sum().reset_index()
    fig3 = px.line(sales_trend, x='Date', y='Sales', title='Sales Trend Over Time')
    fig3.show()
else:
    print("No 'Date' column found; skipping the sales trend chart.")