# File containing code to separate enrollment data based on level

In [1]:
# Dependencies
import pandas as pd
import os

In [2]:
# Load the raw 2015 regular-course student-enrollment table.
# index_col=False tells pandas not to use the first column as the index.
# Every empty cell in the frame is then replaced with 0 (this applies to all
# columns, not only the numeric ones).
df = pd.read_csv(
    "../data/raw/C-2015-DCF-Block_2D-Student_enrollment_for_Regular_Courses-2015.csv",
    index_col=False,
).fillna(0)

In [3]:
# Build the aggregated enrollment columns.
# NOTE(review): if the "total_total_*" columns already include the pwd and
# minority counts, adding them again double-counts those students -- confirm
# against the data dictionary of the raw file.
def _add_columns(frame, names):
    """Return the element-wise sum of the columns *names* of *frame*, added left to right."""
    running = frame[names[0]]
    for name in names[1:]:
        running = running + frame[name]
    return running


df["total_enrollment"] = _add_columns(
    df,
    [
        "total_total_persons",
        "pwd_total_persons",
        "muslim_minority_total_persons",
        "other_minority_total_persons",
    ],
)
df["total_female_enrollment"] = _add_columns(
    df,
    [
        "total_total_females",
        "pwd_total_females",
        "muslim_minority_total_females",
        "other_minority_total_females",
    ],
)
# Male enrollment is derived as everyone who is not counted as female.
df["total_male_enrollment"] = df["total_enrollment"] - df["total_female_enrollment"]

In [4]:
# Keep only the college identifiers, the aggregated counts and the level.
required_columns = [
    "College_id",
    "College_name",
    "total_enrollment",
    "total_female_enrollment",
    "total_male_enrollment",
    "levell",
]
df = df[required_columns]

In [5]:
# Separate data based on level
# Only the enrollment counts are summed. Without the explicit column
# selection, pandas >= 2.0 (where numeric_only defaults to False) also "sums"
# the string column "levell", i.e. concatenates the level name once per row
# and writes that junk column to the output files.
_ENROLLMENT_COLUMNS = [
    "total_enrollment",
    "total_female_enrollment",
    "total_male_enrollment",
]


def _enrollments_for_level(frame, level):
    """Return per-college enrollment totals for one course level.

    Rows of *frame* whose "levell" value equals *level* are grouped by
    ("College_id", "College_name") and the three enrollment count columns
    are summed within each group. The result is indexed by that pair.
    """
    rows = frame[frame["levell"] == level]
    grouped = rows.groupby(by=["College_id", "College_name"])
    return grouped[_ENROLLMENT_COLUMNS].sum()


pg = _enrollments_for_level(df, "Post Graduate")
phd = _enrollments_for_level(df, "Ph.D.")
pgd = _enrollments_for_level(df, "PG Diploma")
mphil = _enrollments_for_level(df, "M.Phil.")
integrated = _enrollments_for_level(df, "Integrated")
diploma = _enrollments_for_level(df, "Diploma")
certificate = _enrollments_for_level(df, "Certificate")
ug = _enrollments_for_level(df, "Under Graduate")

In [6]:
# Make sure the output directory exists.
# os.makedirs creates every missing directory on the path (including
# "../data" and "../data/processed"), and exist_ok=True makes the call a
# no-op when the directory is already there. This replaces the
# check-then-create pair of os.path.exists + os.mkdir, which could race with
# another process and failed when "../data" itself was missing.
os.makedirs("../data/processed/enrollments", exist_ok=True)

In [7]:
# Write one CSV per course level into the enrollments output directory.
# The file-name suffix "enrollemnts" (sic) is kept exactly as it was so that
# anything reading these files continues to find them.
output_dir = "../data/processed/enrollments"
frames_by_prefix = {
    "pg": pg,
    "phd": phd,
    "pgd": pgd,
    "mphil": mphil,
    "integrated": integrated,
    "diploma": diploma,
    "certificate": certificate,
    "ug": ug,
}
for prefix, frame in frames_by_prefix.items():
    frame.to_csv(f"{output_dir}/{prefix}_enrollemnts.csv")