# In [None]:
import pandas as pd
import numpy as np
from datetime import datetime

# Sample data loading: read the main dataset that the statistics,
# grouping and transform sections of this script also operate on.
data_BM = pd.read_csv(r'C:\path\to\data.csv')

# 1. Sorting and Aggregating Data
# Order the rows by 'grade' first and by 'marks' within equal grades
# (ascending, which is the sort_values default), then preview the result.
# NOTE(review): other sections read 'Item_MRP' / 'Outlet_Size' from this
# same frame -- confirm data.csv really contains 'grade' and 'marks'
# columns; if it does not, this line raises KeyError.
data_BM = data_BM.sort_values(by=['grade', 'marks'], ascending=True)
print(data_BM.head())

# 2. Concatenating Multiple DataFrames
# Read the three per-size outlet files in order: small, medium, high.
outlet_size_small, outlet_size_medium, outlet_size_high = (
    pd.read_csv(csv_path)
    for csv_path in (
        r'C:\path\to\outlet_size_small.csv',
        r'C:\path\to\outlet_size_medium.csv',
        r'C:\path\to\outlet_size_high.csv',
    )
)

# Stack the frames row-wise. ignore_index=True discards each file's own
# row labels and renumbers the combined rows from 0.
final_list = [outlet_size_small, outlet_size_medium, outlet_size_high]
combined_data = pd.concat(final_list, axis=0, ignore_index=True)
print(combined_data.shape)

# 3. Performing SQL-like Joins
previous_data = pd.read_csv(r'C:\path\to\previous_data.csv')
Outlet_data = pd.read_csv(r'C:\path\to\outlet_data.csv')

# Left join on 'Outlet_Identifier': every row of previous_data is kept and
# the Outlet_data columns are attached where the key matches (NaN where it
# does not).
# Note: this rebinds combined_data, so the concatenated frame built in
# section 2 is no longer reachable under that name afterwards.
combined_data = pd.merge(
    previous_data,
    Outlet_data,
    how='left',
    on='Outlet_Identifier',
)
print(combined_data.head())

# 4. Statistical Calculations
# Total, mean and median of the 'Item_MRP' column, printed in that order.
item_mrp = data_BM['Item_MRP']
for statistic in (item_mrp.sum, item_mrp.mean, item_mrp.median):
    print(statistic())

# mode() returns a Series rather than a scalar, because several values can
# tie for most frequent.
print(data_BM['Outlet_Size'].mode())

# Per-column summary statistics (count, mean, std, min, quartiles, max);
# with mixed dtypes describe() reports the numeric columns only by default.
print(data_BM.describe())

# 5. Grouping and Pivot Tables
# Mean of every numeric column for each (Outlet_Size, Item_Type) pair.
# numeric_only=True is passed explicitly: since pandas 2.0 the default is
# False, so a bare .mean() raises TypeError as soon as the frame holds a
# non-numeric column outside the grouping keys, whereas older versions
# silently dropped such columns. Passing it keeps grouped_data a DataFrame
# with the same numeric columns on both old and new pandas.
# NOTE(review): presumably data_BM has string columns such as
# 'Item_Identifier' (used as a grouping key in section 7) -- confirm.
grouped_data = data_BM.groupby(['Outlet_Size', 'Item_Type']).mean(numeric_only=True)
print(grouped_data['Item_MRP'])

# The same kind of aggregation expressed as a pivot table: mean 'Item_MRP'
# for each 'Item_Type'.
pivot_table = pd.pivot_table(data_BM, index='Item_Type', values='Item_MRP', aggfunc='mean')
print(pivot_table)

# 6. Preprocessing Time Series Data
time_series_data = pd.read_csv(r'C:\path\to\time_series.csv')

# Parse the 'Datetime' column into real datetimes, then derive the weekday
# name and the month number from it. assign() evaluates the keyword
# arguments in order, so the later lambdas already see the parsed column.
time_series_data = time_series_data.assign(
    Datetime=lambda frame: pd.to_datetime(frame['Datetime']),
    day_name=lambda frame: frame['Datetime'].dt.day_name(),
    month=lambda frame: frame['Datetime'].dt.month,
)
print(time_series_data.head())

# 7. Transforming Data (Average Item Visibility)
# transform('mean') returns one value per original row (not one per group),
# so every row receives the mean 'Item_Visibility' of its 'Item_Identifier'
# group and the result can be stored directly as a new column.
visibility_by_item = data_BM.groupby('Item_Identifier')['Item_Visibility']
data_BM['avg_item_visibility_1'] = visibility_by_item.transform('mean')
print(data_BM.head())

# Example of handling Unix timestamps
unix_data = pd.read_csv(r'C:\path\to\data_with_timestamp.csv')

# unit='s' tells pandas to read the numbers as seconds since the Unix
# epoch; the converted values replace the raw 'timestamp' column.
epoch_seconds = unix_data['timestamp']
unix_data['timestamp'] = pd.to_datetime(epoch_seconds, unit='s')
print(unix_data.head())
