# Day 5 – Item Popularity Features
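This notebook computes item-level (per-`aid`) popularity statistics: click, cart and order counts, plus two ratio features — CTR (defined here as carts per click) and CVR (orders per click).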

In [None]:
# Step 1: Count how often each behaviour type occurred for every item.
# Rows are item ids (`aid`); there is one column per value found in `type_name`,
# and item/type combinations that never occur are filled with 0.
aid_stats = df.groupby(['aid', 'type_name']).size().unstack(fill_value=0)

# `unstack` only creates columns for behaviour types that actually appear in
# `df`. The later steps index 'clicks', 'carts' and 'orders' directly, so add
# any missing one as an all-zero column instead of failing with a KeyError.
for behaviour in ('clicks', 'carts', 'orders'):
    if behaviour not in aid_stats.columns:
        aid_stats[behaviour] = 0
aid_stats.head()

In [None]:
# Step 2: Build the conversion-rate features.
#   CTR = carts  / clicks  (carts per click, i.e. a click-to-cart rate)
#   CVR = orders / clicks  (orders per click)
# The column names are kept as-is because they are written to the exported CSV.
#
# Items with zero clicks get a rate of 0.0. Adding a small epsilon to the
# denominator instead would turn "1 cart, 0 clicks" into a ratio of ~100000,
# which is a meaningless outlier rather than a usable feature value.
clicks_nonzero = aid_stats['clicks'].where(aid_stats['clicks'] > 0)  # NaN where clicks == 0
aid_stats['CTR'] = (aid_stats['carts'] / clicks_nonzero).fillna(0.0)
aid_stats['CVR'] = (aid_stats['orders'] / clicks_nonzero).fillna(0.0)
aid_stats[['clicks', 'carts', 'orders', 'CTR', 'CVR']].head()

In [None]:
# Step 3: Find the most-clicked items and visualise them.
import matplotlib.pyplot as plt

# Rank every item by click count (highest first) and keep the top 20.
top_clicks = aid_stats.sort_values(by='clicks', ascending=False).head(20)

# Reverse the order so the most-clicked item ends up at the top of the
# horizontal bar chart (barh draws the first row at the bottom).
clicks_for_plot = top_clicks['clicks'].iloc[::-1]

fig, ax = plt.subplots(figsize=(10, 6))
clicks_for_plot.plot(kind='barh', color='#8da0cb', ax=ax)
ax.set_title("Top 20 Most Clicked Items")
ax.set_xlabel("Clicks")
ax.set_ylabel("Item ID (aid)")
ax.grid(axis='x')  # vertical guide lines only, to help read bar lengths
plt.show()

In [None]:
# Step 4: Save the item-level feature table as CSV for later use.
# The index is written as the first column so each row keeps its item id.
aid_stats.to_csv('aid_level_features.csv', index=True)