# Task 5 - Data Analysis on CSV Files

This notebook demonstrates a basic sales-data analysis with pandas: loading a CSV file, inspecting the data, grouping and aggregating it, and plotting the results. It uses the included `sales_data.csv` file.


In [None]:

import pandas as pd
# Load the sales records; the 'Date' column is converted to datetimes while reading.
df = pd.read_csv(
    'sales_data.csv',
    parse_dates=['Date'],
)
# Report the (rows, columns) size of the loaded frame.
print('Shape:', df.shape)
# Preview the first rows as the cell's rich output.
df.head()


In [None]:

# Structural overview of the frame: column names, dtypes and non-null counts.
df.info()

# Per-column tally of missing (NaN/NaT) entries, printed below the info summary.
print(
    '\nMissing values per column:\n',
    df.isna().sum(),
)


In [None]:

# Total Sales per Category and per Region, each ordered from largest to smallest.
cat_sales = (
    df.groupby('Category')['Sales']
    .sum()
    .sort_values(ascending=False)
)
reg_sales = (
    df.groupby('Region')['Sales']
    .sum()
    .sort_values(ascending=False)
)
# Render both summaries, category totals first.
display(cat_sales, reg_sales)


In [None]:

# Monthly sales trend
# Bucket every row into its calendar month. pd.to_datetime is applied defensively
# in case 'Date' is not already a datetime column. The resulting 'YYYY-MM' labels
# are zero-padded strings, so sorting them lexicographically is also chronological.
# NOTE: this adds a 'Month' column to df itself.
df['Month'] = pd.to_datetime(df['Date']).dt.to_period('M').astype(str)

# Sum Sales within each month and order the series by month label.
monthly = df.groupby('Month')['Sales'].sum().sort_index()

# Keep a handle on the Axes so the figure can be labelled; a plot should be
# readable on its own when the notebook is skimmed.
ax = monthly.plot(kind='line', marker='o', figsize=(10, 4), title='Monthly Sales Trend')
ax.set_xlabel('Month')
# The trailing ';' keeps the label's text repr out of the cell output.
ax.set_ylabel('Total Sales');


In [None]:

# Show the pre-rendered plot images (per the original note, these were already
# saved in the submission folder). This cell only displays them; it writes no files.
from IPython.display import Image, display

# Display order: by category, by region, then the monthly trend.
for png_name in (
    'sales_by_category.png',
    'sales_by_region.png',
    'monthly_sales_trend.png',
):
    display(Image(png_name))
