# Trader Behavior Insights
**Candidate:** Shambhavi Kulkarni

This notebook runs the full reproducible analysis for the assignment: loading data, cleaning, EDA, per-account analysis, and saving outputs in the required folder structure.


In [None]:
# Imports & paths
import pandas as pd
import matplotlib.pyplot as plt
import os
from datetime import datetime

# Drive folder for this submission; edit this path after mounting Drive in Colab.
# NOTE(review): no later cell visible in this notebook reads `root` -- confirm
# whether the outputs are meant to be written underneath it.
root = '/content/drive/MyDrive/ds_Shambhavi_Kulkarni'

# Make sure the figure directory exists (relative to the current working
# directory); exist_ok=True keeps re-runs of this cell from failing.
os.makedirs(name='outputs', exist_ok=True)


In [None]:
# Read the two input CSVs. The paths below are Colab upload locations;
# replace them with your own paths (uploaded files or a mounted Drive).
trader_csv_path = '/content/e5b9901b-8d54-4472-acce-bf7d8e145269.csv'
sentiment_csv_path = '/content/13525650-aed5-43f4-963c-809a157f394b.csv'

trader = pd.read_csv(trader_csv_path)
sent = pd.read_csv(sentiment_csv_path)

# Preview the first rows of the trader table as the cell output.
trader.head()

In [None]:
# Preprocessing: parse timestamps, derive calendar dates, aggregate trades
# per day, then join the daily aggregates with the sentiment table.

# errors='coerce' turns values that do not match the format into NaT
# instead of raising.
trade_ts = pd.to_datetime(trader['Timestamp IST'], format='%d-%m-%Y %H:%M', errors='coerce')
trader['Timestamp IST'] = trade_ts
trader['Date'] = trade_ts.dt.date

sent_ts = pd.to_datetime(sent['date'], format='%Y-%m-%d', errors='coerce')
sent['date'] = sent_ts
sent['Date'] = sent_ts.dt.date

# One row per trading date: summed Closed PnL, summed Size USD and the
# mean Execution Price.
daily_aggregations = {
    'Closed PnL': 'sum',
    'Size USD': 'sum',
    'Execution Price': 'mean',
}
daily = trader.groupby('Date').agg(daily_aggregations).reset_index()

# Inner join: only dates present in both tables survive.
sentiment_cols = sent[['Date', 'classification', 'value']]
merged = daily.merge(sentiment_cols, on='Date', how='inner')
merged.head()

In [None]:
# Quick EDA plot (matplotlib): distribution of the per-date Closed PnL in
# `merged`, grouped by sentiment classification.
#
# The figure and axes are created explicitly and the axes are handed to
# pandas. When `by=` is used without `ax=`, DataFrame.boxplot opens a figure
# of its own, so a preceding plt.figure(figsize=...) is left behind as an
# empty figure and its size is not applied to the boxplot.
# `plt` comes from the imports cell at the top of the notebook.
fig, ax = plt.subplots(figsize=(8, 4))
merged.boxplot(column='Closed PnL', by='classification', grid=False, ax=ax)
ax.set_title('Closed PnL by Sentiment')
ax.set_xlabel('Sentiment classification')
ax.set_ylabel('Closed PnL')
fig.suptitle('')  # drop the automatic "Boxplot grouped by ..." super-title
fig.savefig('outputs/boxplot_pnl_by_sentiment.png', bbox_inches='tight')
plt.show()

In [None]:
# Per-account summary: one row per Account with summed Closed PnL, summed
# Size USD, mean Execution Price and a trade count.
# 'Timestamp IST': 'count' counts the non-null timestamps per account and the
# resulting column is renamed to 'Trade Count'.
# NOTE(review): rows whose timestamp was coerced to NaT during preprocessing
# are not included in that count -- confirm this is intended.
acct = trader.groupby('Account').agg({
    'Closed PnL': 'sum',
    'Size USD': 'sum',
    'Execution Price': 'mean',
    'Timestamp IST': 'count'
}).rename(columns={'Timestamp IST':'Trade Count'}).reset_index()

# Create the target directory first: to_csv does not create missing parent
# directories and raises OSError when 'csv_files' does not exist.
os.makedirs('csv_files', exist_ok=True)

# Export the 20 accounts with the highest total Closed PnL.
acct.sort_values('Closed PnL', ascending=False).head(20).to_csv('csv_files/top_20_accounts_by_pnl.csv', index=False)
acct.head()

## Next steps
- Replace placeholder paths with your Colab Drive paths.
- Upload the notebook to Google Colab and run all cells from a fresh runtime.
- Ensure the `ds_<your_name>` folder is uploaded to your Drive and that its link is shared with view access.