# B2B SaaS Pipeline Analysis
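This notebook analyzes a synthetic (fake) B2B SaaS deals dataset: average sales-cycle length by segment, total deal amount by owner, and the number of deals in each pipeline stage.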

In [None]:
import pandas as pd
import matplotlib.pyplot as plt

# Read the deals CSV and parse both date columns in a single chain.
#   - created_date: strict parsing (an unparseable value raises).
#   - closed_date:  errors='coerce' turns unparseable/missing values into NaT,
#                   so rows without a close date are kept.
df = pd.read_csv('dataset.csv').assign(
    created_date=lambda frame: pd.to_datetime(frame['created_date']),
    closed_date=lambda frame: pd.to_datetime(frame['closed_date'], errors='coerce'),
)

# Preview the first rows
df.head()

In [None]:
# Sales cycle = whole days elapsed between creation and close.
# Rows whose closed_date is NaT produce NaN here.
df['sales_cycle_days'] = df['closed_date'].sub(df['created_date']).dt.days

# Mean sales cycle per segment (the mean skips NaN rows by default)
avg_cycle = df.groupby('segment')['sales_cycle_days'].agg('mean')
avg_cycle

In [None]:
# Sum of deal amounts for each owner.
# NOTE(review): this sums `amount` over every row regardless of stage —
# confirm whether only won deals should count as revenue.
revenue_by_owner = df.groupby('owner')['amount'].agg('sum')
revenue_by_owner

In [None]:
# Plot deals by stage
# Number of deals in each stage; value_counts orders stages by frequency (descending).
stage_counts = df['stage'].value_counts()

# Create the Figure/Axes explicitly and direct every call at `ax`, instead of
# relying on pyplot's implicit "current axes" state.
fig, ax = plt.subplots(figsize=(8, 5))
stage_counts.plot(kind='bar', color='skyblue', ax=ax)
ax.set_title('Number of Deals by Stage')
ax.set_xlabel('Stage')
ax.set_ylabel('Count')
plt.show()