In [None]:
!pip install pandas matplotlib seaborn scikit-learn

import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

%matplotlib inline

# Build a small synthetic sales dataset: ten consecutive daily rows starting
# on 2025-01-01, each with a category, a sales figure and a customer rating.
data = {
    'Date': pd.date_range(start='2025-01-01', periods=10, freq='D'),
    'Category': ['Electronics', 'Clothing', 'Groceries', 'Electronics', 'Clothing',
                 'Groceries', 'Electronics', 'Clothing', 'Groceries', 'Electronics'],
    'Sales': [1200, 800, 600, 1500, 700, 900, 1100, 950, 620, 1400],
    'Customer_Rating': [4.5, 3.8, 4.2, 4.7, 3.5, 4.0, 4.6, 3.9, 4.1, 4.8]
}

df = pd.DataFrame(data)

# Persist the dataset so the loading step below has a file to read.
df.to_csv('sales_dataset.csv', index=False)

# Reload the dataset from disk. A CSV stores dates as text, so ask pandas to
# parse the 'Date' column back into datetime values; without this the column
# comes back as strings and date-based plotting/resampling no longer works
# on real dates.
try:
    df = pd.read_csv("sales_dataset.csv", parse_dates=['Date'])
except FileNotFoundError:
    print("Error: File not found. Check the path!")
except Exception as e:
    # Best-effort: report the problem and keep using the in-memory DataFrame
    # that was built before the reload attempt.
    print(f"An error occurred: {e}")

# Quick inspection of the loaded data. Each summary is printed explicitly:
# Jupyter only renders a bare expression when it is the last statement of a
# cell (and a plain script never does), so without print() these results
# would be computed and silently discarded.
print(df.head())
df.info()  # info() writes its report to stdout on its own
print(df.isnull().sum())  # number of missing values per column

# Fill missing values in numeric columns with that column's mean.
df.fillna(df.select_dtypes(include=['number']).mean(), inplace=True)

print(df.describe())
print(df.groupby('Category')['Sales'].mean())  # mean sales per category

# Line chart of Sales against the Date column; DataFrame.plot returns the
# Axes it drew on, which is then labelled directly.
trend_ax = df.plot(kind='line', x='Date', y='Sales', figsize=(8, 5))
trend_ax.set_title('Sales Trends Over Time')
trend_ax.set_xlabel('Date')
trend_ax.set_ylabel('Sales')
plt.show()

# Bar chart of Sales grouped by Category (seaborn's barplot aggregates each
# group with its default estimator); label the Axes it returns.
category_ax = sns.barplot(data=df, x='Category', y='Sales')
category_ax.set_title('Average Sales Per Category')
category_ax.set_xlabel('Category')
category_ax.set_ylabel('Average Sales')
plt.show()

# Histogram of the Sales column using 30 bins; Series.hist returns the Axes
# it drew on, which is then labelled directly.
sales_column = df['Sales']
hist_ax = sales_column.hist(bins=30)
hist_ax.set_title('Distribution of Sales')
hist_ax.set_xlabel('Sales')
hist_ax.set_ylabel('Frequency')
plt.show()

# Scatter plot with Customer_Rating on the x-axis and Sales on the y-axis;
# label the Axes that seaborn returns.
scatter_ax = sns.scatterplot(data=df, x='Customer_Rating', y='Sales')
scatter_ax.set_title('Customer Rating vs Sales')
scatter_ax.set_xlabel('Customer Rating')
scatter_ax.set_ylabel('Sales')
plt.show()
