# File containing code to separate teaching staff data

In [1]:
# Dependencies
import pandas as pd
import os

In [2]:
# Load the raw 2015 teaching-staff summary CSV into a dataframe.
# index_col=False tells pandas not to use the first column as the index.
df = pd.read_csv(
    filepath_or_buffer="../data/raw/C-2015-DCF-Block_2C-Teaching_Staff_Summary-2015.csv",
    index_col=False,
)

In [3]:
# Remove the "survey_year" column, which is not needed downstream
df = df.drop(labels="survey_year", axis="columns")

In [4]:
# Replace every missing (NA) cell in the dataframe with 0
df = df.fillna(value=0)

In [5]:
# Split out the rows for each professor designation (exact string match
# on the "designation" column)
prof1 = df.loc[df["designation"].eq("Additional Professor")]
prof2 = df.loc[df["designation"].eq("Assistant Professor")]
prof3 = df.loc[df["designation"].eq("Associate Professor")]

In [6]:
# Split out the rows for each lecturer designation (exact string match
# on the "designation" column)
lecturer1 = df.loc[df["designation"].eq("Lecturer")]
lecturer2 = df.loc[df["designation"].eq("Lecturer (Selection Grade)")]
lecturer3 = df.loc[df["designation"].eq("Lecturer (Senior Scale)")]

In [7]:
# Split out the rows for each teacher designation (exact string match
# on the "designation" column)
teacher1 = df.loc[df["designation"].eq("Contract Teacher")]
teacher2 = df.loc[df["designation"].eq("Temporary Teacher")]
teacher3 = df.loc[df["designation"].eq("Visiting Teacher")]

In [8]:
# Stack the three professor subsets row-wise into one dataframe
prof = pd.concat(objs=[prof1, prof2, prof3], axis=0)

In [9]:
# Stack the three lecturer subsets row-wise into one dataframe
lecturer = pd.concat(objs=[lecturer1, lecturer2, lecturer3], axis=0)

In [10]:
# Stack the three teacher subsets row-wise into one dataframe
teacher = pd.concat(objs=[teacher1, teacher2, teacher3], axis=0)

In [11]:
# Sum the numeric staff columns per institution for each staff category.
# numeric_only=True keeps text columns such as "designation" out of the sum;
# without it, newer pandas versions concatenate the strings (or raise on
# mixed-type columns) instead of ignoring them.
# Calculate total number of professors in each institution
prof = prof.groupby(by=["id", "institution_name"]).sum(numeric_only=True)
# Calculate total number of lecturers in each institution
lecturer = lecturer.groupby(by=["id", "institution_name"]).sum(numeric_only=True)
# Calculate total number of teachers in each institution
teacher = teacher.groupby(by=["id", "institution_name"]).sum(numeric_only=True)

In [12]:
# Make sure the output directory exists before any results are written.
# os.makedirs also creates missing parent directories ("../data" and
# "../data/processed"), and exist_ok=True makes the call a no-op when the
# directory is already present, so no separate existence check is needed.
os.makedirs("../data/processed/teachingStaff", exist_ok=True)

In [13]:
# Save each aggregated dataframe to its own CSV file
for frame, destination in (
    (prof, "../data/processed/teachingStaff/college_professor_data.csv"),
    (lecturer, "../data/processed/teachingStaff/college_lecturer_data.csv"),
    (teacher, "../data/processed/teachingStaff/college_teacher_data.csv"),
):
    frame.to_csv(destination)