## Clean Up : School Demographic Info (schools.csv)


In [3]:
%matplotlib inline
import numpy as np
import scipy as sp
import matplotlib as mpl
import matplotlib.cm as cm
import matplotlib.pyplot as plt
import pandas as pd
# Console width (in characters) pandas may use before wrapping a repr.
pd.set_option('display.width', 500)
# Show up to 100 columns before pandas truncates a wide frame with "...".
pd.set_option('display.max_columns', 100)
# Render DataFrames as HTML tables in the notebook.
pd.set_option('display.notebook_repr_html', True)
import seaborn as sns
# Plot styling: white background with grid lines, elements scaled for the "poster" context.
sns.set_style("whitegrid")
sns.set_context("poster")

In [12]:
# Load schools.csv (raw data) into sdf_v0; the cleaning cells below work on a
# copy (sdf_v1), so this frame stays as loaded.
sdf_v0  = pd.read_csv("tempdata/schools.csv")
# Display (rows, columns) as a quick sanity check on the load.
sdf_v0.shape


(99074, 355)

In [7]:
'''
●      Key for missing/NA/etc:
○      † indicates that the data are not applicable.
○      – indicates that the data are missing.
○      ‡ indicates that the data do not meet NCES data quality standards.
○       There are some escaped quotes “”
'''
# sc_drdf = schools.csv column [d]rop / [r]ename table; the next cell reads its
# 'Raw Column Name' and 'New Column Name' columns.
sc_drdf = pd.read_csv("tempdata/schools_rc.csv")
# Work on an independent copy (copy() is deep by default) so sdf_v0 keeps the raw data.
sdf_v1  = sdf_v0.copy()


In [9]:
# Apply the drop/rename instructions held in sc_drdf to the raw frame in one pass.
#
# Each mapping row pairs a 'Raw Column Name' with a 'New Column Name'; the
# literal value "drop" in the latter marks the raw column for removal, any
# other value is the column's new name.
#
# sdf_v1 is rebuilt from sdf_v0 instead of being mutated in place, so this cell
# is idempotent: re-running it no longer raises KeyError on columns that a
# previous run already dropped. It also replaces one full-frame drop/rename per
# mapping row with a single drop and a single rename.
#
# NOTE(review): assumes every mapping row refers to a raw column name and that
# each raw name appears at most once in the mapping -- confirm against schools_rc.csv.
raw_names = sc_drdf['Raw Column Name'].astype(str)
new_names = sc_drdf['New Column Name'].astype(str)
drop_mask = new_names == "drop"

cols_to_drop   = raw_names[drop_mask].tolist()
cols_to_rename = dict(zip(raw_names[~drop_mask], new_names[~drop_mask]))

# rename() silently ignores labels that are not present in the frame, so
# surface them here instead of letting a mapping typo go unnoticed.
unmatched = [name for name in cols_to_rename if name not in sdf_v0.columns]
if unmatched:
    print("Rename skipped, column not found in schools.csv: {}".format(unmatched))

# drop() still raises KeyError for an unknown column, as the original loop did.
sdf_v1 = sdf_v0.drop(cols_to_drop, axis=1).rename(columns=cols_to_rename)

sdf_v1.shape

(99074, 335)

##### School Demographics : Column Notations 

| Notation       | Description                              |
| :------------- | ---------------------------------------- |
| pk             | School Year : Prekindergarten            |
| k              | School Year : Kindergarten               |
| g (g1,g2… g12) | School Year : Grade (Grade1, Grade2… Grade12) |
| ug             | School Year : Ungraded                   |
| an             | Race : American Indian/Alaska Native     |
| a              | Race : Asian/Pacific Islander            |
| h              | Race : Hispanic                          |
| b              | Race : Black                             |
| w              | Race : White                             |
| hp             | Race : Hawaiian Native/Pacific Islander  |
| mr             | Race : Two or more races                 |
| m              | Sex : Male                               |
| f              | Sex : Female                             |



In [10]:
# Preview the first rows of sdf_v1 to eyeball the column names after the drop/rename step.
sdf_v1.head()

Unnamed: 0,﻿School Name,state,state_abbr,school_id_nces,agency_name,agency_id_nces,county,data_available,data_na,city,zipcode,school_type,agency_type,operational,charter_school,magnet_school,shared_time_school,location_type,title1_school_wide,title1_eligible,title1_status,latitude,longitude,school_id_state,agency_id_state,congressional_code,virtual_school,lunch_program,charter_primary,charter_secondary,offered_g_lowest,offered_g_highest,offered_pk,offered_k,offered_g1,offered_g2,offered_g3,offered_g4,offered_g5,offered_g6,offered_g7,offered_g8,offered_g9,offered_g10,offered_g11,offered_g12,offered_ug,total_students,lunch_free_eligible,lunch_reduced_eligible,...,g10_w_m,g10_w_f,g10_hp_m,g10_hp_f,g10_mr_m,g10_mr_f,g11_an_m,g11_an_f,g11_a_m,g11_a_f,g11_h_m,g11_h_f,g11_b_m,g11_b_f,g11_w_m,g11_w_f,g11_hp_m,g11_hp_f,g11_mr_m,g11_mr_f,g12_an_m,g12_an_f,g12_a_m,g12_a_f,g12_h_m,g12_h_f,g12_b_m,g12_b_f,g12_w_m,g12_w_f,g12_hp_m,g12_hp_f,g12_mr_m,g12_mr_f,gug_an_m,gug_an_f,gug_a_m,gug_a_f,gug_h_m,gug_h_f,gug_b_m,gug_b_f,gug_w_m,gug_w_f,gug_hp_m,gug_hp_f,gug_mr_m,gug_mr_f,teacher_fulltime,pupil_teacher_ratio
0,"EDWARD ""DUKE"" ELLINGTON @ BECKHAM",Michigan,MI,261200004838,DETROIT CITY SCHOOL DISTRICT,2612000,WAYNE COUNTY,1986-2013,–,DETROIT,48213,1-Regular school,1-Local school district,1-Currently operational,2-No,2-No,2-No,11-City: Large,1-Yes,1-Yes,5-Eligible for Title I SWP provides SWP program,42.4084,-82.9786,"=""03737""",82010,2614,Not a virtual school,Yes under Community Eligibility Option (CEO),†,†,Prekindergarten,8th Grade,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,2-No,2-No,2-No,2-No,1-Yes,697,609,0,...,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,0,0,0,0,0,0,0,0,0,0,0,0,0,0,41.0,17.0
1,"J.M. ""CHICK"" BUCKBEE JUVENILE CENTER",West Virginia,WV,540051101159,INSTITUTIONAL EDUCATIONAL PROGRAMS,5400511,HAMPSHIRE COUNTY,2003-2013,1986-2002,AUGUSTA,26704,4-Alternative/other school,5-State-operated institution,1-Currently operational,†,†,2-No,42-Rural: Distant,†,2-No,6-Not eligible for either TAS or SWP,39.3013,-78.6464,34126,3400000,5402,Not a virtual school,Yes participating without using any Provision ...,†,†,7th Grade,12th Grade,2-No,2-No,2-No,2-No,2-No,2-No,2-No,2-No,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,2-No,15,12,0,...,3,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,1,0,1,0,2,0,0,0,0,0,†,†,†,†,†,†,†,†,†,†,†,†,†,†,2.0,7.5
2,"JAMES H. ""TIGER"" MORTON JUVENILE CENTER",West Virginia,WV,540051101146,INSTITUTIONAL EDUCATIONAL PROGRAMS,5400511,KANAWHA COUNTY,2003-2013,1986-2002,DUNBAR,25064,4-Alternative/other school,5-State-operated institution,1-Currently operational,†,†,2-No,41-Rural: Fringe,†,2-No,6-Not eligible for either TAS or SWP,38.3747,-81.76,34125,3400000,5402,Not a virtual school,Yes participating without using any Provision ...,†,†,7th Grade,12th Grade,2-No,2-No,2-No,2-No,2-No,2-No,2-No,2-No,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,2-No,17,14,0,...,2,2,0,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,1,4,0,0,0,0,0,†,†,†,†,†,†,†,†,†,†,†,†,†,†,2.0,8.5
3,"MARY HARRIS ""MOTHER"" JONES ELEMENTARY",Maryland,MD,240051001257,PRINCE GEORGE'S COUNTY PUBLIC SCHOOLS,2400510,PRINCE GEORGE'S COUNTY,2002-2013,1986-2001,ADELPHI,20783,1-Regular school,1-Local school district,1-Currently operational,2-No,2-No,2-No,21-Suburb: Large,1-Yes,1-Yes,5-Eligible for Title I SWP provides SWP program,38.9999,-76.9661,161730,16,2404,Not a virtual school,Yes participating without using any Provision ...,†,†,Prekindergarten,6th Grade,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,2-No,2-No,2-No,2-No,2-No,2-No,2-No,1029,856,83,...,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,69.01,14.91
4,"PEMAYETV EMAHAKV CHARTER ""OUR WAY SCHOOL""",Florida,FL,120066004849,GLADES,1200660,GLADES COUNTY,2006-2013,1986-2005,OKEECHOBEE,34974,1-Regular school,1-Local school district,1-Currently operational,1-Yes,2-No,2-No,43-Rural: Remote,†,2-No,6-Not eligible for either TAS or SWP,27.0856,-81.0805,"=""0056""",22,1217,Not a virtual school,No,1200660,–,Kindergarten,5th Grade,2-No,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,1-Yes,2-No,2-No,2-No,2-No,2-No,2-No,2-No,2-No,175,0,0,...,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,†,29.0,6.03


In [11]:
# Persist the cleaned frame. index=True is the pandas default, spelled out here
# because it writes the row index as an extra, unnamed first column in the file.
sdf_v1.to_csv("tempdata/schools_v1.csv", index=True)