**Business Performance Optimization**

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [None]:
# Read the Superstore export that sits next to this notebook.
csv_path = "Sample - Superstore.csv"
df = pd.read_csv(csv_path)

# Quick sanity check: show the first four rows.
df.head(4)

In [None]:
# Count missing values per column (isna is the same method as isnull).
df.isna().sum()

In [None]:
# Print the frame summary: column names, non-null counts, dtypes and memory usage.
df.info()

**Profit by Region**

In [None]:
# Total sales and profit per region, most profitable region first.
region = (
    df.groupby('Region')[['Sales', 'Profit']]
    .sum()
    .sort_values('Profit', ascending=False)
)
region

In [None]:
import os
# The plotting cells below save their figures under images/, so create it first.
# exist_ok=True keeps this cell safe to re-run.
figure_dir = "images"
os.makedirs(figure_dir, exist_ok=True)

In [None]:
# Bar chart of total profit per region, drawn on an explicit Axes and saved to disk.
fig, ax = plt.subplots()
sns.barplot(x=region.index, y=region['Profit'], ax=ax)
ax.set_title("Profit by Region")
fig.savefig("images/barplot.png", dpi=300, bbox_inches="tight")
plt.show()

**Profit Margin by Category**

In [None]:
# Aggregate sales and profit per category, then derive margin = profit / sales.
category = (
    df.groupby('Category')[['Sales', 'Profit']]
    .sum()
    .assign(**{'Profit Margin': lambda totals: totals['Profit'] / totals['Sales']})
)

# Display categories ranked from highest to lowest margin (category itself stays unsorted).
category.sort_values(by='Profit Margin', ascending=False)

In [None]:
# Total profit per product category, largest first.
cat_profit = (
    df.groupby('Category')['Profit']
    .sum()
    .sort_values(ascending=False)
)

# Draw the bar chart, write it to disk, then render it inline.
cat_profit.plot.bar(title='Profit by Product Category')
plt.savefig("images/plot.png", dpi=300, bbox_inches="tight")
plt.show()

**Correlation Analysis**

In [None]:
# Pairwise correlation between the four numeric measures, shown as an annotated heatmap.
numeric_cols = ['Sales', 'Profit', 'Discount', 'Quantity']
corr_matrix = df[numeric_cols].corr()

sns.heatmap(corr_matrix, annot=True, cmap='Blues')
plt.title('Correlation Heatmap')
plt.savefig("images/heatmap.png", dpi=300, bbox_inches="tight")
plt.show()

**Discount Impact on Profit**

In [None]:
# One point per row: discount on the x-axis, profit on the y-axis.
# alpha=0.6 keeps overlapping points distinguishable.
fig, ax = plt.subplots()
sns.scatterplot(x='Discount', y='Profit', data=df, alpha=0.6, ax=ax)
ax.set_title("Effect of Discount on Profit")
fig.savefig("images/scatterplot.png", dpi=300, bbox_inches="tight")
plt.show()

In [None]:
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression

In [None]:
# Feature matrix (three numeric predictors) and regression target (profit).
X = df.loc[:, ['Sales', 'Quantity', 'Discount']]
y = df.loc[:, 'Profit']

In [None]:
# Hold out 20% of the rows for evaluation; the fixed seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

In [None]:
# Fit ordinary least squares on the training split (fit returns the estimator itself).
model = LinearRegression().fit(X_train, y_train)

# Bare expression so the cell still displays the fitted estimator.
model

In [None]:
# Report goodness of fit on the held-out split. The label previously rendered as
# "RÂ²" because the superscript-two character had been mis-decoded.
print("R² Score:", model.score(X_test, y_test))

# Pair each feature name with its fitted coefficient so the output is self-describing.
print("Coefficients:", list(zip(X.columns, model.coef_)))

In [None]:
# What-if scenario: reduce every discount by 10% and ask the fitted model how
# the average profit would change.
new_discount = df['Discount'] * 0.9

baseline_features = df[['Sales', 'Quantity', 'Discount']]
scenario_features = baseline_features.assign(Discount=new_discount)

# Compare prediction against prediction. Subtracting the mean of the *actual*
# profit would fold the model's own error on the full frame into the estimate,
# because the model was fitted on the training split only. With both terms
# coming from the same model, the difference reflects only the discount change.
baseline_profit = model.predict(baseline_features)
predicted_profit = model.predict(scenario_features)
improvement = predicted_profit.mean() - baseline_profit.mean()

print(f"Expected Profit Improvement: {improvement:.2f}")