In [94]:
import pandas as pd
import numpy as np

# Load the results table from CSV into `df`.
# The path is relative, so it resolves against the kernel's working directory.
df = pd.read_csv('../data/results/results_chi_25.csv')

In [95]:
# Preview the first rows; the trailing ';' suppresses the cell's displayed output.
df.head();

In [96]:
# Maps raw CSV column names to the human-readable headers used in the rest of the notebook.
column_name_map = {
    # Bibliographic fields
    "paper_id": "ID",
    "title": "Title",
    "authors": "Authors",
    "venue": "Venue",
    "year": "Year",
    "url": "URL",
    "abstract": "Abstract",
    # Task description fields
    "coding_task": "Coding Task",
    "task_summary": "Task Summary",
    "participant_skill_level": "Participant Skill Level",
    "programming_language": "Language",
    "programming_domain": "Domain",
    "programming_sub_domain": "Sub-domain",
    "task_type": "Task Type",
    "code_size_scope": "Codebase Size",
    "evaluation_metrics": "Evaluation Metrics",
    "tools_environment": "Tools and Environment",
    "research_focus": "Research Focus",
    # Classification flags
    "is_programming_related": "Programming Related",
    "is_ai_related": "AI or LLM Related",
}

# Renamed columns whose values are title-cased by clean_capitalization().
capitalize_list = [
    "Participant Skill Level",
    "Language",
    "Domain",
    "Sub-domain",
    "Task Type",
    "Codebase Size",
    "Programming Related",
    "AI or LLM Related",
]

In [97]:
def clean_author_col(df):
    """Rewrite the 'Authors' column from "Last, First; Last, First" to "First Last, First Last".

    Each cell is split on ';' into authors and each author on ',' into name
    parts; the first two parts are swapped so the given name comes first.
    Whitespace around every part is stripped, and the cleaned names are joined
    with ", ".

    Every row produces exactly one output value, so the new column always has
    the same length as the frame:
      * a missing / non-string cell (e.g. NaN from ``read_csv``) becomes '';
      * empty author entries (such as the one after a trailing ';') are skipped;
      * an author without a comma is kept unchanged rather than dropped.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame containing an 'Authors' column.

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object, with its 'Authors' column replaced in place.

    Raises
    ------
    KeyError
        If ``df`` has no 'Authors' column.
    """

    def _format_authors(authors):
        # Missing cells are NaN/None rather than '', so check the type explicitly
        # instead of relying on truthiness (NaN is truthy).
        if not isinstance(authors, str):
            return ''

        cleaned_names = []
        for author in authors.split(';'):
            name_parts = [part.strip() for part in author.split(',')]
            if len(name_parts) >= 2:
                # "Last, First" -> "First Last"; strip again in case one side is empty.
                full_name = f"{name_parts[1]} {name_parts[0]}".strip()
            else:
                # No comma: keep the name as written.
                full_name = name_parts[0]
            if full_name:
                cleaned_names.append(full_name)

        return ', '.join(cleaned_names)

    df['Authors'] = df['Authors'].map(_format_authors)
    return df

def clean_capitalization(df):
    """Title-case the values of every column named in ``capitalize_list``.

    The listed columns are overwritten on ``df`` itself, and ``df`` is returned.
    Note that ``str.title`` lowercases everything after the first letter of
    each word, so acronyms are altered (e.g. "AI" becomes "Ai").
    """
    titled = {name: df[name].str.title() for name in capitalize_list}
    for name, values in titled.items():
        df[name] = values
    return df

def clean_columns(df):
    """Return a new frame with headers renamed via ``column_name_map`` and
    the 'ID', 'Venue' and 'URL' columns removed.

    The input frame is not modified.
    """
    unwanted = ['ID', 'Venue', 'URL']
    return df.rename(columns=column_name_map).drop(columns=unwanted)

In [98]:
# Cleaning pipeline: rename/drop columns, reformat author names, then title-case
# the categorical columns. Order matters: the later steps use the renamed headers.
df = (
    df
    .pipe(clean_columns)
    .pipe(clean_author_col)
    .pipe(clean_capitalization)
)

In [99]:
# Total row count, followed by the number of rows for each
# (Programming Related, AI or LLM Related) combination.
print(len(df))
for programming_flag, ai_flag in [('Yes', 'Yes'), ('No', 'No'), ('Yes', 'No'), ('No', 'Yes')]:
    matches = df[(df['Programming Related'] == programming_flag) & (df['AI or LLM Related'] == ai_flag)]
    print(len(matches))

98
32
7
48
11


In [100]:
# Rows flagged as both programming-related and AI/LLM-related.
df.loc[df['Programming Related'].eq('Yes') & df['AI or LLM Related'].eq('Yes')]

Unnamed: 0,Title,Authors,Year,Abstract,Coding Task,Task Summary,Participant Skill Level,Language,Domain,Sub-domain,Task Type,Codebase Size,Evaluation Metrics,Tools and Environment,Research Focus,Programming Related,AI or LLM Related
0,MVPrompt: Building Music-Visual Prompts for AI...,"ChungHa Lee, DaeHo Lee, Jin-Hyuk Hong",2025,,"In the user study, participants were tasked wi...",Participants refined music video scene prompts...,"Intermediate, Expert",Not Specified,Creative/Media,Generative Ai Video Production,Feature Development,Not Specified,"Quality of generated scenes, participant feedback","Gen-3 Alpha model on Runway, Zoom",Impact of stages of MVPrompt system on creativ...,Yes,Yes
2,CARING-AI: Towards Authoring Context-aware Aug...,"Jingyu Shi, Rahul Jain, Seunggeun Chi, Hyun...",2025,,"In the user study, participants were tasked wi...",Participants generated step-by-step instructio...,"Intermediate, Expert",C# (Likely For Unity Development),Human-Computer Interaction,Instructional Design,Feature Development,Function,"User satisfaction ratings, System Usability Sc...","Unity, ChatGPT",Evaluating interaction design of CARING-AI sys...,Yes,Yes
10,Prompting in the Dark: Assessing Human Perform...,"Zeyu He, Saniya Naphade, Ting-Hao Kenneth H...",2025,,"In the study, participants were tasked with us...",Participants used the PromptingSheet tool to i...,Intermediate,Not Specified,Artificial Intelligence/Ml,Natural Language Processing,Content Creation,Snippet,"Quality of labeled tweets, participant feedbac...","PromptingSheet, Zoom, Microsoft Teams",Understanding participant engagement with the ...,Yes,Yes
14,Evaluating Non-AI Experts' Interaction with AI...,"Qingxiao Zheng, Minrui Chen, Hyanghee Park,...",2025,,"In the user study, participants were tasked wi...",Participants were tasked with creating and ass...,"Beginner, Intermediate",Not Specified,Human-Computer Interaction,Conversational Agents,Feature Development,Not Specified,Qualitative assessments from think-aloud sessi...,AgentBuilder platform,Understanding challenges faced by non-AI exper...,Yes,Yes
23,Generative and Malleable User Interfaces with ...,"Yining Cao, Peiling Jiang, Haijun Xia",2025,,"In the user study, participants were tasked wi...",Participants completed two freeform tasks usin...,"Intermediate, Expert",Not Specified,Human-Computer Interaction,Ui Customization,User Interface Design,Not Specified,"5-point Likert scale questionnaire, qualitativ...",Not specified,Understanding user interaction and customizati...,Yes,Yes
27,Interactive Debugging and Steering of Multi-Ag...,"Will Epperson, Gagan Bansal, Victor C Dibia...",2025,,"In the user study, participants were tasked wi...",Participants debugged multi-agent systems usin...,"Intermediate, Expert",Not Specified,Artificial Intelligence/Ml,Debugging Ai Agents,Debugging,Not Specified,"Accuracy of final answers, qualitative analysi...",AGDebugger,Understanding developer interaction with debug...,Yes,Yes
28,Classroom Simulacra: Building Contextual Stude...,"Songlin Xu, Hao-Ning Wen, Hongyi Pan, Dalla...",2025,,"In the user study, participants were tasked wi...",Participants engaged in an online education wo...,"Beginner, Intermediate",Not Specified,Education/Learning,Online Education Systems,Data Collection,Not Specified,Quality of gaze and facial expression data col...,CogEdu system,Impact of contextual generative agents on stud...,Yes,Yes
29,AutoPBL: An LLM-powered Platform to Guide and ...,"Yihao Zhu, Zhoutong Ye, Yichen Yuan, Wenxua...",2025,,"In the study, participants were tasked with co...",Participants completed programming exercises i...,Beginner,Python,Data Science/Analytics,Machine Learning,Code Comprehension,Snippet,"Effectiveness of question types, participants'...",Jupyter Notebook,Understanding how programming tasks and reflec...,Yes,Yes
31,Canvil: Designerly Adaptation for LLM-Powered ...,"K. J. Kevin Feng, Q. Vera Liao, Ziang Xiao,...",2025,,"In the study, participants were tasked with de...",Participants designed user interfaces for a 3-...,"Intermediate, Expert",Not Specified,Human-Computer Interaction,User Interface Design,Feature Development,Not Specified,Qualitative evaluation focusing on design disc...,"Figma, videoconferencing software",Investigating collaborative dynamics in design...,Yes,Yes
33,Can AI writing be salvaged? Mitigating Idiosyn...,"Tuhin Chakrabarty, Philippe Laban, Chien-She...",2025,,"In the study, participants were tasked with ed...",Participants edited and annotated problematic ...,Expert,Not Specified,Artificial Intelligence/Ml,Natural Language Processing,Feature Development,Not Specified,"Number of edits completed, diversity of catego...",Editing interface designed for annotation process,Understanding how creative writers interact wi...,Yes,Yes
