In [7]:
import pandas as pd
import plotly.express as px

# Load the dataset
df = pd.read_excel('Final Lead Data.xlsx')

# Drop duplicates based on 'Email'
df = df.drop_duplicates(subset='Email', keep='first')

# Combine 'Branch/ Specialisation' and 'Other Branch' into 'Branch' and drop the original columns
df['Branch'] = df['Branch/ Specialisation'].fillna('') + ' ' + df['Other Branch'].fillna('')
df = df.drop(['Branch/ Specialisation', 'Other Branch'], axis=1)

# Combine 'New College Name' and 'Colleges' into 'College' and drop the original columns
df['College'] = df['Colleges'].fillna('') + ' ' + df['New College Name'].fillna('')
df = df.drop(['Colleges', 'New College Name'], axis=1)

# Visualizations using Plotly Express
fig_gender = px.bar(x=df['Gender'].value_counts().index, y=df['Gender'].value_counts().values,
                    labels={'x': 'Gender', 'y': 'Count'},
                    title='Count of Attendees by Gender')
fig_city = px.bar(x=df['City'].value_counts().index, y=df['City'].value_counts().values,
                  labels={'x': 'City', 'y': 'Count'},
                  title='Count of Attendees by City')
fig_branch = px.bar(x=df['Branch'].value_counts().index, y=df['Branch'].value_counts().values,
                    labels={'x': 'Branch', 'y': 'Count'},
                    title='Count of Attendees by Branch')

# Show the plots
fig_gender.show()
fig_city.show()
fig_branch.show()

# Data preparation for graduation year prediction
df['Academic Year'] = df['Academic Year'].fillna(0).astype(int)
df['Year'] = pd.to_datetime(df['Created']).dt.year
df['Year of Graduation'] = df.apply(lambda row: row['Year'] + (4 - row['Academic Year']) if row['Academic Year'] != 0 else '', axis=1)

# Save to files
df.to_excel('Predicted Year of Graduation.xlsx', index=False)
df.to_csv('Predicted Year of Graduation.csv', index=False)



Could not infer format, so each element will be parsed individually, falling back to `dateutil`. To ensure parsing is consistent and as-expected, please specify a format.

