In [None]:
# Imports and Setup
# ===========================
import pandas as pd
from transformers import pipeline
import sys
from IPython.display import display, Markdown

# Add the parent directory (project root) to the Python path so the 'src' package can be imported
sys.path.append('../')
from src.analytics_engine import calculate_vendor_metrics, create_lending_score

In [None]:
# Load Model and Data
# ===========================
# Build the NER pipeline from the Hugging Face model ID below.
print("Loading NER model pipeline...")
model_id = "abeni505/results"
ner_pipeline = pipeline(task="ner", model=model_id)

# Read the scraped posts, then discard rows that lack a view count or a date.
print("Loading scraped Telegram data...")
df = pd.read_csv('../data/scraped_telegram_data.csv')
df.dropna(subset=['views', 'date'], inplace=True)
print(f"Loaded {df.shape[0]} messages with complete metadata.")


In [None]:
# Run the Analytics Engine
# ================================
# Hands the loaded posts (`df`) and the NER pipeline to the project engine, then
# feeds the resulting per-vendor table into the lending-score step. Both
# functions come from src.analytics_engine; their internals are not visible here.
# This step can take some time as it runs the NER model over many posts.
# NOTE(review): a tqdm progress bar is expected to report progress here —
# confirm against calculate_vendor_metrics.
vendor_scorecard = calculate_vendor_metrics(df, ner_pipeline)
final_scorecard = create_lending_score(vendor_scorecard)

In [None]:
# Display the Final Vendor Scorecard
# ==========================================
# Jupyter only auto-renders the value of a cell's LAST expression. A bare
# Markdown(...) in the middle of a cell is built and then discarded, so each
# piece is passed to display() explicitly to make the heading and the
# explanatory text actually appear above the table.
display(Markdown("# EthioMart FinTech Vendor Scorecard"))
display(Markdown("""
This table ranks vendors based on their potential as candidates for micro-lending. The **Lending Score** is a composite metric calculated from a vendor's market reach (`Avg. Views/Post`) and their business consistency (`Posts/Week`). A higher score indicates a more active and visible vendor.
"""))
# Round numeric columns to two decimals for presentation only; the underlying
# `final_scorecard` frame is left unchanged.
display(final_scorecard.round(2))