# Walmart Purchase Behavior Analysis - Python (Pandas, NumPy)

# In [None]:

# Walmart Customer Purchase Behavior Analysis

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Load the data
df = pd.read_csv("walmart.csv")

# Check basic info
# DataFrame.info() writes its report straight to stdout and returns None,
# so it is called directly; wrapping it in print() would emit a stray "None".
df.info()

# Summary statistics
print(df.describe())

# Check for missing values (count of nulls per column)
print(df.isnull().sum())

# Convert the grouping columns to pandas' categorical dtype
# (no new columns are created here; only the dtype of existing ones changes).
for categorical_col in ('City_Category', 'Age'):
    df[categorical_col] = df[categorical_col].astype('category')

# Purchase by Gender: mean purchase per gender, highest first
gender_purchase = (
    df.groupby('Gender')['Purchase']
    .mean()
    .sort_values(ascending=False)
)
print("Average Purchase by Gender:\n", gender_purchase)

# Purchase by Age Group: mean purchase per age group, highest first.
# 'Age' has been cast to a categorical earlier in this script. Grouping on a
# categorical without an explicit `observed` relies on a deprecated default
# and triggers a FutureWarning on recent pandas. The categories were inferred
# from the data itself, so every level is observed and observed=True yields
# the same groups.
age_purchase = (
    df.groupby('Age', observed=True)['Purchase']
    .mean()
    .sort_values(ascending=False)
)
print("Average Purchase by Age Group:\n", age_purchase)

# Bar chart: one bar per Age value, bar height = mean of Purchase
age_fig, age_ax = plt.subplots(figsize=(8, 4))
sns.barplot(data=df, x='Age', y='Purchase', estimator=np.mean, ax=age_ax)
age_ax.set_title("Average Purchase by Age Group")
plt.show()

# Box plot: distribution of Purchase within each City_Category
city_fig, city_ax = plt.subplots(figsize=(8, 4))
sns.boxplot(data=df, x='City_Category', y='Purchase', ax=city_ax)
city_ax.set_title("Purchase Distribution by City")
plt.show()

# Correlation Heatmap
# Pairwise correlations, restricted to numeric columns via numeric_only=True.
corr = df.corr(numeric_only=True)

# Open a fresh figure, as the other plots in this script do. Without it the
# heatmap is drawn on whatever axes are current, which is the previous plot
# whenever plt.show() did not close it (interactive mode or non-GUI backends).
plt.figure()
sns.heatmap(corr, annot=True, cmap='coolwarm')
plt.title("Correlation Heatmap")
plt.show()
