In [None]:
# Mount the user's Google Drive into the Colab filesystem at /content/drive so
# that files stored in Drive can be opened by path. Requires the Colab runtime
# (the google.colab package).
from google.colab import drive
drive.mount('/content/drive')

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
from matplotlib.ticker import FuncFormatter
# Path of the Excel workbook to analyse, located under the mounted Google Drive.
file_path = '/content/drive/MyDrive/Cleans.xlsx'

In [None]:
"""Introduction
Goal: Top-selling products, Total Sales per Month & Sales Trend, Percentage of Canceled Orders, Top 3 States & Cities with Canceled Orders,
    Proportion of Service Levels (Standard vs. Expedited)"""
# Read the workbook at file_path into a DataFrame. The bare `df` on the last
# line makes the notebook render the frame as this cell's output.
df = pd.read_excel(file_path)
df

In [None]:
# Print a structural summary of df: column names, non-null counts and dtypes.
df.info()

In [None]:
# Show the column labels available in df.
df.columns

In [None]:
# Share of orders whose courier status is 'Cancelled', as a percentage of all rows in df.
is_cancelled = df['CourierStatus'] == 'Cancelled'
Cancelled_Order = len(df[is_cancelled])
Total_Order = len(df)
Cancelled_Percent = Cancelled_Order / Total_Order * 100
print(f"Percentage of cancelled orders: {Cancelled_Percent:.2f}%")

In [None]:
# The three shipping states with the most cancelled orders.
State_Cancelled = df.loc[df['CourierStatus'].eq('Cancelled')]
state_counts = State_Cancelled['Ship_State'].value_counts()
Cancelled_By_State = state_counts.iloc[:3]
Cancelled_By_State

In [None]:
# The three shipping cities with the most cancelled orders.
cancelled_rows = df['CourierStatus'].isin(['Cancelled'])
City_Cancelled = df[cancelled_rows]
Cancelled_By_City = (
    City_Cancelled['Ship_City']
    .value_counts()
    .head(3)
)
Cancelled_By_City

In [None]:
# Switch matplotlib to its dark theme (black figure background).
plt.style.use('dark_background')

# Tally how many orders used each shipping service level.
Service_Level_Counts = df['ShipServiceLevel'].value_counts()

# The two levels to compare; a level missing from the data becomes a zero-sized slice.
labels = ['Standard', 'Expedited']
Standard_Count, Expedited_Count = (
    Service_Level_Counts.get(level, 0) for level in labels
)
sizes = [Standard_Count, Expedited_Count]

# Pie chart with the percentage printed on each slice.
plt.figure(figsize=(6, 6))
plt.pie(
    sizes,
    labels=labels,
    colors=['white', 'skyblue'],
    autopct='%1.1f%%',
    startangle=140,
)
plt.title('Proportion of Service Level (Standard vs Expedited)', color='white')

# Render the figure.
plt.show()


'Most customers prefer Expedited service, which suggests that delivery speed is an important factor in their purchasing decisions.'

In [None]:
# Create a bar chart for total sales per month.
#
# The month number is derived into its own Series instead of being written back
# into df['Date']. Overwriting the column destroyed the original order dates and
# made this cell non-idempotent: on a second run the month integers would be
# parsed by pd.to_datetime as nanosecond offsets from the epoch, collapsing
# every row into month 1.
#
# NOTE(review): grouping is by calendar month number only, so the same month
# from different years would be added together — confirm the data covers a
# single year before relying on this for longer date ranges.
order_month = pd.to_datetime(df['Date']).dt.month
monthly_sales = df['Amount'].groupby(order_month).sum()

# Draw the bars and keep the Axes so labels are set on this plot explicitly.
ax = monthly_sales.plot(kind='bar', figsize=(10, 6), color='skyblue')

# Title and axis labels
ax.set_title('Total Sales Per Month', fontsize=16)
ax.set_xlabel('Month', fontsize=12)
ax.set_ylabel('Total Sales', fontsize=12)

# Show Y-axis ticks as full numbers with thousands separators (no scientific notation)
formatter = FuncFormatter(lambda x, _: f'{x:,.0f}')
ax.yaxis.set_major_formatter(formatter)

# Display the chart
plt.show()

"From the Total sales data of the past 3 months, there is a clear short-term downward trend in sales."

In [None]:
# Top 3 categories.
# Top_Cat holds the number of orders (rows) per category: .size() counts rows
# and does not look at the Amount values, so on its own it says nothing about
# sales. The summary below adds each category's share of all orders and its
# summed Amount so that statements about both order share and sales can be
# checked against the data.
Top_Cat = df.groupby('Category')['Amount'].size().sort_values(ascending=False).head(3)

# Total sales amount per category, restricted to the top-3 categories above.
Category_Sales = df.groupby('Category')['Amount'].sum()
Top_Cat_Summary = pd.DataFrame({
    'Orders': Top_Cat,
    'Order_Share_%': (Top_Cat / len(df) * 100).round(2),
    'Total_Sales': Category_Sales.reindex(Top_Cat.index),
})
Top_Cat_Summary

"Set as the Category with the highest sales and approximately 40% of total orders."

 Key Insights


1.  Total sales over the past 3 months show a clear short-term downward trend.

2. Most customers prefer Expedited shipping.
3. "Set" is the category with the highest sales, accounting for approximately 40% of total orders.

Recommendations

Boost short-term sales: Investigate possible reasons for the recent decline (e.g., seasonal effects, end of promotions, stock issues). Launch short-term promotions or marketing campaigns during low-sales periods to recover momentum.

Leverage shipping preference: Since customers prefer Expedited shipping, ensure service quality and delivery consistency. Offer limited-time shipping discounts to encourage more customers to choose Expedited service.

Focus on the “Set” category: Invest in expanding or promoting products under the “Set” category, as it generates the highest revenue share. Analyze sub-products in this category to identify new opportunities for product bundling or cross-selling.

Conclusion

The e-commerce sales analysis highlights three points:

-A short-term decline in overall sales, requiring proactive marketing actions.

-A strong customer preference for fast delivery, highlighting logistics as a competitive advantage.

-The “Set” category is the main revenue driver and should remain a focus for future sales growth.


In summary: Maintaining efficient Expedited delivery services, reinforcing marketing efforts for high-performing categories, and running targeted promotions during slow sales periods can help sustain growth and improve customer satisfaction.