# AI-Enhanced Lead Prioritization
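This notebook demonstrates an AI-based lead-scoring feature. We simulate a small B2B leads dataset, fit a logistic regression model on it, and rank the leads by the predicted probability that each one is qualified (used here as a proxy for likelihood to convert). Because the model is scored on the same five leads it was trained on, the scores are illustrative only.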

In [None]:
import numpy as np
import pandas as pd
from sklearn.compose import ColumnTransformer
from sklearn.linear_model import LogisticRegression
from sklearn.preprocessing import OneHotEncoder, StandardScaler

# Simulated B2B leads: one dict per lead. 'Qualified' is the binary training
# label; 'Company' is only an identifier and is never passed to the model.
data = [
    {'Company': 'AlphaTech', 'Industry': 'Technology', 'CompanySize': 'Large', 'NumEmployees': 1000,
     'AnnualRevenue': 500.0, 'WebsiteVisits': 1000, 'EmailOpens': 300, 'Qualified': 1},
    {'Company': 'BetaFinance', 'Industry': 'Finance', 'CompanySize': 'Medium', 'NumEmployees': 200,
     'AnnualRevenue': 150.0, 'WebsiteVisits': 400, 'EmailOpens': 80, 'Qualified': 1},
    {'Company': 'GammaHealth', 'Industry': 'Healthcare', 'CompanySize': 'Large', 'NumEmployees': 1200,
     'AnnualRevenue': 550.0, 'WebsiteVisits': 800, 'EmailOpens': 200, 'Qualified': 1},
    {'Company': 'DeltaTech', 'Industry': 'Technology', 'CompanySize': 'Small', 'NumEmployees': 50,
     'AnnualRevenue': 20.0,  'WebsiteVisits': 100, 'EmailOpens': 20, 'Qualified': 0},
    {'Company': 'EpsilonFinance', 'Industry': 'Finance', 'CompanySize': 'Small', 'NumEmployees': 30,
     'AnnualRevenue': 5.0,   'WebsiteVisits': 50,  'EmailOpens': 5,  'Qualified': 0},
]
df = pd.DataFrame(data)

# Name the feature groups once so the feature matrix and the preprocessing
# step cannot drift apart.
CATEGORICAL_FEATURES = ['Industry', 'CompanySize']
NUMERIC_FEATURES = ['NumEmployees', 'AnnualRevenue', 'WebsiteVisits', 'EmailOpens']

X = df[CATEGORICAL_FEATURES + NUMERIC_FEATURES]
y = df['Qualified']

# Preprocessing:
# - One-hot encode the categorical columns. handle_unknown='ignore' encodes a
#   category that was not seen during fit as all zeros instead of raising, so
#   a new lead from an unseen industry can still be scored.
# - Standardize the numeric columns. LogisticRegression applies L2
#   regularization by default; leaving raw magnitudes (5 .. 1200) next to 0/1
#   one-hot flags makes that penalty uneven across features and can keep the
#   solver from converging.
ct = ColumnTransformer(
    [
        ('ohe', OneHotEncoder(handle_unknown='ignore'), CATEGORICAL_FEATURES),
        ('scale', StandardScaler(), NUMERIC_FEATURES),
    ]
)
X_transformed = ct.fit_transform(X)

model = LogisticRegression()
model.fit(X_transformed, y)

# Column 1 of predict_proba is the probability of the positive class
# (Qualified == 1). NOTE: these are in-sample scores -- the model is evaluated
# on the same rows it was trained on, so they only illustrate the ranking.
probs = model.predict_proba(X_transformed)[:, 1]
df['Score'] = np.round(probs, 3)

# Highest score first; a stable sort keeps the input row order for leads whose
# rounded scores tie, so the ranking is reproducible.
df_sorted = df.sort_values('Score', ascending=False, kind='mergesort')

# Bare final expression: rendered as the notebook cell's output.
df_sorted[['Company', 'Score', 'Qualified']]