## Prep

In [1]:
import os
import sys
import json
import pandas as pd
from IPython.display import display, HTML
import matplotlib.pyplot as plt
import seaborn as sns

# ------------------------------------------------------------------
# 1. Make sure Python can find your agent package / module
#    (adapt the path if your repo layout is different)
# ------------------------------------------------------------------
# The quoted "__file__" is deliberate: notebook kernels normally do not define
# `__file__`, so the literal string is resolved as a placeholder file name
# against the current working directory. The two dirname() calls then strip
# that placeholder and the working directory itself (normally the notebook's
# folder), leaving the parent of the working directory.
ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath("__file__")))

# Re-running this cell must not keep stacking duplicates of the same entry.
if ROOT_DIR not in sys.path:
    sys.path.append(ROOT_DIR)

## GPT-4o, without domain prompting

In [2]:
from agents.d2insight_gpt4o import analyze_csv_with_insights   # noqa: E402

# Inputs for the baseline run. They are defined outside the __main__ guard
# because a later cell reads `csv_file` and `question` unconditionally; keeping
# them inside the guard would raise NameError there whenever the guard is false
# (e.g. the notebook exported to a module and imported).
csv_file = "https://drive.google.com/uc?export=download&id=1JhsgpIulCv8Q9NPTZGhrz5-y_RUufMoO"      # path to your CSV
question = "analysis this file with insights."

if __name__ == "__main__":
    # Print the agent's answer so it is captured as this cell's output.
    print(analyze_csv_with_insights(csv_file, question))




{
  "dataset_overview": {
    "total_records": 15,
    "columns": [
      "Current Period",
      "Customer ID",
      "Periods Active",
      "Current Customer (Y/N)",
      "Period Acquired",
      "Period Terminated",
      "Acquisition Channel",
      "Sector",
      "Referred (Y/N)",
      "Premium (Y/N)",
      "Region",
      "Co. Age",
      "Size",
      "No. Maker Contracts",
      "No. Advanced Contracts",
      "Revenue, Total",
      "Maker Revenue",
      "Advanced Revenue",
      "Expected CLV"
    ]
  },
  "key_insights": {
    "customer_status": {
      "current_customers": 1,
      "terminated_customers": 14
    },
    "acquisition_channel": {
      "external": 11,
      "internal": 4
    },
    "sector": {
      "aerospace": 15
    },
    "region_distribution": {
      "southeast": 3,
      "northeast": 5,
      "midwest": 4,
      "west": 3
    },
    "company_age_distribution": {
      "0-5yrs": 8,
      "6-10yrs": 4,
      "10+yrs": 3
    },
    "size_distribution

In [3]:
import json

# Run the baseline analysis and persist its answer as pretty-printed JSON.
# NOTE(review): this is a second, independent call to the agent; if the agent
# is non-deterministic, the saved JSON may differ from the output printed by
# the previous cell.
result = analyze_csv_with_insights(csv_file, question)

# Parse before opening the target: open(..., "w") truncates the file right
# away, so decoding inside the `with` block would leave an empty file behind
# (or wipe an earlier good one) whenever the response is not valid JSON.
result_parsed = json.loads(result)

# Save the result to a JSON file
with open("exp01_d2insight_gpt4o_stimhartnow_result.json", "w", encoding="utf-8") as f:
    json.dump(result_parsed, f, indent=2)



## GPT-4o, with domain prompting

In [4]:
from agents.d2insight_gpt4o_domain import analyze_csv_with_insights_domain   # noqa: E402

# Inputs for the domain-aware run. They are defined outside the __main__ guard
# because a later cell reads `csv_file` and `question` unconditionally; keeping
# them inside the guard would make that cell depend on the guard being true.
csv_file = "https://drive.google.com/uc?export=download&id=1JhsgpIulCv8Q9NPTZGhrz5-y_RUufMoO"      # path to your CSV
question = "analysis this file with insights."

if __name__ == "__main__":
    # Print the agent's answer so it is captured as this cell's output.
    print(analyze_csv_with_insights_domain(csv_file, question))

{
  "domain": "Customer Relationship Management (CRM) in the Aerospace Sector",
  "insights": {
    "customer_retention": {
      "current_customers": 1,
      "terminated_customers": 14,
      "retention_rate": "6.67%",
      "observation": "The majority of customers have terminated their contracts, indicating potential issues with customer retention strategies."
    },
    "acquisition_channels": {
      "external_acquisitions": 11,
      "internal_acquisitions": 4,
      "observation": "Most customers were acquired through external channels, suggesting a reliance on external marketing or partnerships for customer acquisition."
    },
    "customer_demographics": {
      "region_distribution": {
        "Northeast": 5,
        "Southeast": 3,
        "Midwest": 4,
        "West": 3
      },
      "company_age_distribution": {
        "0-5yrs": 8,
        "6-10yrs": 4,
        "10+yrs": 3
      },
      "size_distribution": {
        "Small": 10,
        "Medium": 5,
        "Large": 

In [5]:
import json

# Run the domain-aware analysis and persist its answer as pretty-printed JSON.
# NOTE(review): this is a second, independent call to the agent; if the agent
# is non-deterministic, the saved JSON may differ from the output printed by
# the previous cell.
result_domain = analyze_csv_with_insights_domain(csv_file, question)

# Parse before opening the target: open(..., "w") truncates the file right
# away, so decoding inside the `with` block would leave an empty file behind
# (or wipe an earlier good one) whenever the response is not valid JSON.
result_domain_parsed = json.loads(result_domain)

# Save the result to a JSON file
with open("exp01_d2insight_gpt4o-domain_stimhartnow_output.json", "w", encoding="utf-8") as f:
    json.dump(result_domain_parsed, f, indent=2)