In [7]:
# import libraries
import numpy as np
import pandas as pd
import glob
import os

In [8]:
# read, combine, and clean csv files
attendance_dir = "Attendance Data"
columnsNeeded = ["First Name", "Last Name", "Email", "Account Type", "Year of Graduation", "Is Member", "Degree", "Registration Date", "Checked-In Date", "Attendee's Rating", "Attendee's Feedback", "Net ID"]


def read_event_csv(path, columns):
    """Load one event export and keep only the wanted columns it actually has.

    Parameters
    ----------
    path : str
        Location of the CSV file to read.
    columns : list of str
        Column names to keep when they are present in the file.

    Returns
    -------
    tuple of (pandas.DataFrame, list of str)
        The trimmed frame (columns stay in the file's own order) and the
        names from ``columns`` that the file does not contain.

    Notes
    -----
    The file is parsed exactly once. Parse errors raised by ``pd.read_csv``
    propagate to the caller instead of being reported as missing columns.
    """
    raw = pd.read_csv(path)
    missing = [name for name in columns if name not in raw.columns]
    # .copy() so that columns added later never write into a slice of `raw`.
    return raw.loc[:, raw.columns.isin(columns)].copy(), missing


# sorted() keeps the row order of the combined file stable between runs;
# glob itself returns matches in arbitrary order.
files = sorted(glob.glob(os.path.join(attendance_dir, "*.csv")))
df_list = []

# read files
for file in files:
    # splitext drops only the final extension, so names that contain ".csv"
    # elsewhere (or use a different letter case) are not mangled.
    fileName = os.path.splitext(os.path.basename(file))[0]

    event_df, missing_columns = read_event_csv(file, columnsNeeded)  # remove unnecessary columns
    if missing_columns:  # if a column needed isn't found
        print(f"Warning: {fileName} does not contain all specified columns. Skipping missing ones.")

    # update individual event data after cleaning
    # NOTE: this overwrites the source export in place with the trimmed
    # columns; keep a backup of the raw exports if the dropped columns matter.
    event_df.to_csv(file, index=False)

    # add event name column before combining dataset
    event_df["Event Name"] = fileName
    df_list.append(event_df)

if df_list:
    df = pd.concat(df_list, ignore_index=True)
    df.to_csv("attendance2024.csv", index=False)
else:
    # pd.concat raises on an empty list; report the real problem instead and
    # leave any existing combined file untouched.
    print(f"Warning: no .csv files found in '{attendance_dir}'. Nothing was combined.")
    df = pd.DataFrame(columns=columnsNeeded + ["Event Name"])
df.head()

Unnamed: 0,First Name,Last Name,Email,Account Type,Year of Graduation,Is Member,Degree,Registration Date,Checked-In Date,Attendee's Rating,Attendee's Feedback,Net ID,Event Name
0,Kernell,Slack,kslack@smu.edu,Undergraduate Student,2027,No,UG Cox School of Business,10/25/2024 10:22:29 AM,10/26/2024 6:07:52 PM,,,49205773@smu.edu,Boaz WP
1,ShyAnte'e,Williams,shyanteew@smu.edu,Staff,Unknown,Yes,Master's of Arts in Higher Education,10/25/2024 4:17:10 PM,10/26/2024 7:06:12 PM,,,46798462@smu.edu,Boaz WP
2,Abdulmohsen,Alkhathlan,aalkhathlan@smu.edu,Graduate Student,2025,No,Law - Masters,10/25/2024 8:44:31 PM,10/26/2024 11:35:44 PM,,,49578809@smu.edu,Boaz WP
3,Abdulmohsen,Alkhathlan,aalkhathlan@smu.edu,Graduate Student,2025,No,Law - Masters,10/25/2024 8:44:31 PM,10/26/2024 11:35:46 PM,,,49578809@smu.edu,Boaz WP
4,Abdulmohsen,Alkhathlan,aalkhathlan@smu.edu,Graduate Student,2025,No,Law - Masters,10/25/2024 8:44:31 PM,10/26/2024 11:35:47 PM,,,49578809@smu.edu,Boaz WP
