In [9]:
import pandas as pd

In [10]:
# Read the survey responses from the Excel workbook into a DataFrame.
df = pd.read_excel(io="newform.xlsx")

In [11]:
# Trim stray whitespace around every header so that the exact-name column
# lookups performed later in the notebook can match.
trimmed_headers = df.columns.str.strip()
df.columns = trimmed_headers

In [12]:
# Survey questions whose answers are scored. Rows are indexed by these
# strings, so every entry has to equal an Excel column header exactly
# (headers are compared after their surrounding whitespace was stripped).
answer_columns = [
    "What type of visualizations are you most interested in creating?",
    "How often do you work with data from multiple sources?",
    "Do you need to create custom calculations or metrics?",
    "How comfortable are you with writing DAX formulas?",
    "Do you use or plan to use Power Query for data transformation?",
    "Are you interested in automating data refresh and report updates?",
    "Do you need to drill through reports to get detailed data views?",
    "How important is data modeling for your projects?",
    "Will you be sharing your reports with external stakeholders?",
    "Do you need to work on real-time data analytics?",
    "Are you interested in mobile accessibility for your reports?",
    "How do you plan to manage data security in Power BI?",
    "Do you use or plan to use AI features in Power BI?",
    "Do you need to perform trend analysis in your reports?",
    "How comfortable are you with using the 'Bookmarks' feature?",
    "Do you plan to use custom themes for your reports?",
    "How familiar are you with the Q&A feature in Power BI?",
    "Are you interested in using the Power BI API for custom solutions?",
    "Do you need to export data from Power BI to other formats?",
    "How do you plan to collaborate with others on Power BI projects?",
]

In [13]:
# Per-respondent accumulators, one entry appended per DataFrame row:
# the training level, the recommended course and the paid course.
categories, recommended_courses, Paid_Courses = [], [], []

In [14]:
# Score every respondent and record a training level plus two course
# suggestions for each row of the DataFrame.
#
# Every question contributes 3, 2 or 1 points. 1 is the fallback for any
# answer that is not listed below (blank cells included), so the total for a
# row lies between len(answer_columns) and 3 * len(answer_columns).

# Answers worth 3 points and 2 points respectively.
HIGH_SCORE_ANSWERS = ["Always", "Yes, complex metrics involving multiple tables", "Advanced level", "Critical", "All the time", "Yes, advanced AI features", "Advanced", "Yes", "Using both shared reports and workspaces"]
MID_SCORE_ANSWERS = ["Often", "Yes, including time-based metrics", "Intermediate level", "Very Important", "Frequently", "Yes, some basic AI features", "Intermediate", "Possibly", "Using Power BI workspaces"]

# Single lookup table, built once instead of re-creating both lists for every
# question of every row. The 3-point answers are written last so they would
# win if an answer ever appeared in both lists.
ANSWER_POINTS = {answer: 2 for answer in MID_SCORE_ANSWERS}
ANSWER_POINTS.update({answer: 3 for answer in HIGH_SCORE_ANSWERS})
DEFAULT_POINTS = 1

# Inclusive upper bounds of the beginner and intermediate tiers.
# NOTE(review): each question adds at least 1 point, so with 20 questions the
# lowest possible total is already 20 -- only a respondent whose answers all
# score 1 reaches the beginner tier. Confirm these cut-offs are intended.
BEGINNER_MAX_SCORE = 20
INTERMEDIATE_MAX_SCORE = 26

# Fail early, naming every mismatched header at once, rather than stopping on
# the first missing column in the middle of the loop.
missing_columns = [question for question in answer_columns if question not in df.columns]
if missing_columns:
    raise KeyError(f"Survey columns not found in the Excel sheet: {missing_columns}")

# Start from empty accumulators so re-running this cell on its own does not
# append a second copy of the results (which would make the lists longer than
# the DataFrame and break the column assignment that follows).
for accumulator in (categories, recommended_courses, Paid_Courses):
    accumulator.clear()

for _row_label, row in df.iterrows():
    score = 0

    # Add up the points of this respondent's answers.
    for question in answer_columns:
        answer = row[question]
        if isinstance(answer, str):
            # Ignore stray whitespace around an answer, as is already done
            # for the column headers.
            answer = answer.strip()
        score += ANSWER_POINTS.get(answer, DEFAULT_POINTS)

    # Map the total onto a training level and its course suggestions.
    if score <= BEGINNER_MAX_SCORE:
        categories.append("Beginner's Training")
        recommended_courses.append('LinkedIn Learning: "Power BI Essential Training"')
        Paid_Courses.append('Udemy: "Microsoft Power BI: A Complete Introduction"')
    elif score <= INTERMEDIATE_MAX_SCORE:
        categories.append('Intermediate Training')
        recommended_courses.append('LinkedIn Learning: "Advanced Power BI"')
        Paid_Courses.append('Udemy: "Microsoft Power BI - Data Modeling and DAX Formulas"')
    else:
        categories.append('Advanced Training')
        recommended_courses.append('LinkedIn Learning: "Power BI Data Methods"')
        Paid_Courses.append('Udemy: "Advanced Microsoft Power BI"')

In [15]:
# Attach the per-respondent results to the DataFrame as three new columns,
# in this order: training level, recommended course, paid course.
result_columns = {
    'Training Level': categories,
    'Recommended Course': recommended_courses,
    'Paid Course': Paid_Courses,
}
for column_name, column_values in result_columns.items():
    df[column_name] = column_values

In [16]:
# Write the DataFrame, including the new columns, to a new Excel workbook
# without the index column.
df.to_excel(excel_writer="categorized_training_needs_with_courses.xlsx", index=False)