In [1]:
import pandas as pd
# Load the college dataset with the institution name (INSTNM) as the index.
# A raw string keeps the Windows backslashes literal; without the r-prefix,
# \A, \d and \c are invalid escape sequences that trigger warnings.
# NOTE(review): absolute local path - consider a configurable data directory.
college = pd.read_csv(r'C:\Anaconda\data\college.csv', index_col='INSTNM')

In [2]:
# Operators only work on a DataFrame whose data is homogeneous, so first
# narrow the frame down to the columns whose names contain 'UGDS_'. Each of
# these columns holds the fraction of undergraduate students of one race.
# The data was loaded above with the institution name as the index label.
college_ugds_ = college.filter(like='UGDS_', axis='columns')
college_ugds_.head()

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,0.0333,0.9353,0.0055,0.0019,0.0024,0.0019,0.0,0.0059,0.0138
University of Alabama at Birmingham,0.5922,0.26,0.0283,0.0518,0.0022,0.0007,0.0368,0.0179,0.01
Amridge University,0.299,0.4192,0.0069,0.0034,0.0,0.0,0.0,0.0,0.2715
University of Alabama in Huntsville,0.6988,0.1255,0.0382,0.0376,0.0143,0.0002,0.0172,0.0332,0.035
Alabama State University,0.0158,0.9208,0.0121,0.0019,0.001,0.0006,0.0098,0.0243,0.0137


In [3]:
# Round every fraction to the nearest whole-number percentage with operators.
#
# Mathematically, adding .005 and then floor-dividing by .01 would be enough,
# but floating point numbers are inexact:
#     >>> .045 + .005
#     0.049999999999999996
# An extra .00001 is therefore added to each number so that the first four
# digits of the floating point representation match the actual value. This
# works because no value in the dataset has more than four decimal places.
#
# The floor division operator, //, then rounds to the whole percentage:
(college_ugds_ + .00501) // .01


Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,3.0,94.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0
University of Alabama at Birmingham,59.0,26.0,3.0,5.0,0.0,0.0,4.0,2.0,1.0
Amridge University,30.0,42.0,1.0,0.0,0.0,0.0,0.0,0.0,27.0
University of Alabama in Huntsville,70.0,13.0,4.0,4.0,1.0,0.0,2.0,3.0,4.0
Alabama State University,2.0,92.0,1.0,0.0,0.0,0.0,1.0,2.0,1.0
The University of Alabama,78.0,11.0,3.0,1.0,0.0,0.0,3.0,3.0,0.0
Central Alabama Community College,73.0,26.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
Athens State University,78.0,12.0,2.0,1.0,2.0,0.0,2.0,1.0,3.0
Auburn University at Montgomery,53.0,34.0,1.0,2.0,0.0,0.0,3.0,4.0,2.0
Auburn University,85.0,7.0,2.0,2.0,1.0,0.0,0.0,1.0,1.0


In [4]:
# Complete the operator-based rounding: dividing the whole-number percentages
# by 100 turns them back into fractions rounded to two decimal places.
# (The round-method version of the same calculation follows in a later cell.)
college_ugds_op_round = (college_ugds_ + .00501) // .01 / 100
college_ugds_op_round.head()

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,0.03,0.94,0.01,0.0,0.0,0.0,0.0,0.01,0.01
University of Alabama at Birmingham,0.59,0.26,0.03,0.05,0.0,0.0,0.04,0.02,0.01
Amridge University,0.3,0.42,0.01,0.0,0.0,0.0,0.0,0.0,0.27
University of Alabama in Huntsville,0.7,0.13,0.04,0.04,0.01,0.0,0.02,0.03,0.04
Alabama State University,0.02,0.92,0.01,0.0,0.0,0.0,0.01,0.02,0.01


In [5]:
# Let the DataFrame round method do the rounding for us. NumPy rounds numbers
# that are exactly halfway between two candidates to the even side, so a
# small fraction is added before rounding.
college_ugds_round = college_ugds_.add(.00001).round(2)

In [6]:
# Use the DataFrame equals method to check that the operator-based rounding
# and the round-method rounding produced the same DataFrame:
college_ugds_op_round.equals(college_ugds_round)

True

In [7]:
# Just as with Series, DataFrames have method equivalents of the operators.
# The operator-based rounding can therefore be rewritten as a method chain
# (add, floordiv, div) and compared against the operator version:
college_ugds_op_round_methods = (
    college_ugds_.add(.00501)
    .floordiv(.01)
    .div(100)
)
college_ugds_op_round_methods.equals(college_ugds_op_round)

True

In [8]:
# Comparing missing values
#
# pandas uses the NumPy NaN object (np.nan) to represent a missing value.
# It is an unusual object because it is not equal to itself, whereas even
# Python's None evaluates as True when compared to itself.
# Every other comparison against np.nan also returns False, except "not
# equal to". NULL values behave the same way in SQL.
import numpy as np

nan_comparisons = (
    np.nan == np.nan,
    np.nan > 5,
    5 > np.nan,
    np.nan != 5,
)
for outcome in nan_comparisons:
    print(outcome)


False
False
False
True


In [9]:
# Series and DataFrames use the equality operator, ==, to make
# element-by-element comparisons that return an object of the same size.
#
# Reload the data and reselect the race-fraction columns for this section.
# The raw string keeps the Windows backslashes literal (no invalid escapes).
college = pd.read_csv(r'C:\Anaconda\data\college.csv', index_col='INSTNM')
college_ugds_ = college.filter(like='UGDS_')

In [10]:
# To get an idea of how the equality operator works, compare each element to a
# scalar value; the result is a boolean DataFrame with the same labels:
college_ugds_ == .0019

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,False,False,False,True,False,True,False,False,False
University of Alabama at Birmingham,False,False,False,False,False,False,False,False,False
Amridge University,False,False,False,False,False,False,False,False,False
University of Alabama in Huntsville,False,False,False,False,False,False,False,False,False
Alabama State University,False,False,False,True,False,False,False,False,False
The University of Alabama,False,False,False,False,False,False,False,False,False
Central Alabama Community College,False,False,False,False,False,False,False,False,True
Athens State University,False,False,False,False,False,False,False,False,False
Auburn University at Montgomery,False,False,False,False,False,False,False,False,False
Auburn University,False,False,False,False,False,False,False,False,False


In [11]:
# Compare the DataFrame with itself element by element. The first rows shown
# are all True, but missing values (NaN) never compare equal to themselves.
college_self_compare = college_ugds_ == college_ugds_
college_self_compare.head()

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,True,True,True,True,True,True,True,True,True
University of Alabama at Birmingham,True,True,True,True,True,True,True,True,True
Amridge University,True,True,True,True,True,True,True,True,True
University of Alabama in Huntsville,True,True,True,True,True,True,True,True,True
Alabama State University,True,True,True,True,True,True,True,True,True


In [12]:
# Using the all method to determine if each column contains only True values
# yields an unexpected result: every column is False, because each column has
# missing values and np.nan is not equal to itself.
college_self_compare.all()

UGDS_WHITE    False
UGDS_BLACK    False
UGDS_HISP     False
UGDS_ASIAN    False
UGDS_AIAN     False
UGDS_NHPI     False
UGDS_2MOR     False
UGDS_NRA      False
UGDS_UNKN     False
dtype: bool

In [13]:
# The primary way to count missing values uses the isnull method; summing the
# resulting booleans gives the number of missing values in each column:
college_ugds_.isnull().sum()

UGDS_WHITE    661
UGDS_BLACK    661
UGDS_HISP     661
UGDS_ASIAN    661
UGDS_AIAN     661
UGDS_NHPI     661
UGDS_2MOR     661
UGDS_NRA      661
UGDS_UNKN     661
dtype: int64

In [14]:
# The correct way to compare two entire DataFrames with one another is the
# equals method, not the == operator. Here it returns True even though the
# frame contains missing values.
college_ugds_.equals(college_ugds_)

True

In [15]:
#Transposing the direction of a DataFrame operation
'''Many DataFrame methods have an axis parameter. This important parameter controls the
direction in which the operation takes place. Axis parameters can only be one of two values,
either 0 or 1, and are aliased respectively as the strings index and columns.
Nearly all DataFrame methods default the axis parameter to 0/index.  '''

'Many DataFrame methods have an axis parameter. This important parameter controls the\ndirection in which the operation takes place. Axis parameters can only be one of two values,\neither 0 or 1, and are aliased respectively as the strings index and columns.\nNearly all DataFrame methods default the axis parameter to 0/index.  '

In [16]:
# Reload the data and reselect the race-fraction columns for the axis examples.
# The raw string keeps the Windows backslashes literal (no invalid escapes).
college = pd.read_csv(r'C:\Anaconda\data\college.csv', index_col='INSTNM')
college_ugds_ = college.filter(like='UGDS_')
college_ugds_.head()

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,0.0333,0.9353,0.0055,0.0019,0.0024,0.0019,0.0,0.0059,0.0138
University of Alabama at Birmingham,0.5922,0.26,0.0283,0.0518,0.0022,0.0007,0.0368,0.0179,0.01
Amridge University,0.299,0.4192,0.0069,0.0034,0.0,0.0,0.0,0.0,0.2715
University of Alabama in Huntsville,0.6988,0.1255,0.0382,0.0376,0.0143,0.0002,0.0172,0.0332,0.035
Alabama State University,0.0158,0.9208,0.0121,0.0019,0.001,0.0006,0.0098,0.0243,0.0137


In [17]:
# The count method returns the number of non-missing values. By default its
# axis parameter is 0, so one count is produced per column:
college_ugds_.count()

UGDS_WHITE    6874
UGDS_BLACK    6874
UGDS_HISP     6874
UGDS_ASIAN    6874
UGDS_AIAN     6874
UGDS_NHPI     6874
UGDS_2MOR     6874
UGDS_NRA      6874
UGDS_UNKN     6874
dtype: int64

In [18]:
# Changing the axis parameter to 1/'columns' transposes the operation so that
# each row of data gets a count of its own non-missing values.
# Not very informative for the rows shown here: the count simply equals the
# number of columns.
college_ugds_.count(axis=1).head()

INSTNM
Alabama A & M University               9
University of Alabama at Birmingham    9
Amridge University                     9
University of Alabama in Huntsville    9
Alabama State University               9
dtype: int64

In [19]:
# Each row of percentages should add up to 1. Summing across the columns of
# each row verifies this:
college_ugds_.sum(axis='columns').head()

INSTNM
Alabama A & M University               1.0000
University of Alabama at Birmingham    0.9999
Amridge University                     1.0000
University of Alabama in Huntsville    1.0000
Alabama State University               1.0000
dtype: float64

In [20]:
# To get an idea of the distribution of each column, take the median down the
# index, which yields one value per race column:
college_ugds_.median(axis='index')

UGDS_WHITE    0.55570
UGDS_BLACK    0.10005
UGDS_HISP     0.07140
UGDS_ASIAN    0.01290
UGDS_AIAN     0.00260
UGDS_NHPI     0.00000
UGDS_2MOR     0.01750
UGDS_NRA      0.00000
UGDS_UNKN     0.01430
dtype: float64

In [21]:
# The same method with axis='columns' gives one median per school, taken
# across that school's race columns:
college_ugds_.median(axis='columns').head()

INSTNM
Alabama A & M University               0.0055
University of Alabama at Birmingham    0.0283
Amridge University                     0.0034
University of Alabama in Huntsville    0.0350
Alabama State University               0.0121
dtype: float64

In [22]:
# The cumsum method with axis=1 ('columns') accumulates the race percentages
# from left to right across each row, giving a slightly different view of the
# data. For example, the UGDS_HISP column now shows the combined share of
# white, black and Hispanic students for each school.
# Accumulating in this direction is meaningful; accumulating down the rows
# would not be for this data.
college_ugds_cumsum = college_ugds_.cumsum(axis='columns')
college_ugds_cumsum.head()

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,0.0333,0.9686,0.9741,0.976,0.9784,0.9803,0.9803,0.9862,1.0
University of Alabama at Birmingham,0.5922,0.8522,0.8805,0.9323,0.9345,0.9352,0.972,0.9899,0.9999
Amridge University,0.299,0.7182,0.7251,0.7285,0.7285,0.7285,0.7285,0.7285,1.0
University of Alabama in Huntsville,0.6988,0.8243,0.8625,0.9001,0.9144,0.9146,0.9318,0.965,1.0
Alabama State University,0.0158,0.9366,0.9487,0.9506,0.9516,0.9522,0.962,0.9863,1.0


In [23]:
# Determining college campus diversity
# This is how a file hosted on GitHub can be read directly by URL.
# According to the notebook author, this file holds the result that the
# following steps set out to produce:
collegediv = pd.read_csv('https://raw.githubusercontent.com/DatasRev/source-files/master/csv/college_diversity.csv', index_col='School')
collegediv.head()

Unnamed: 0_level_0,Diversity Index
School,Unnamed: 1_level_1
"Rutgers University--Newark Newark, NJ",0.76
"Andrews University Berrien Springs, MI",0.74
"Stanford University Stanford, CA",0.74
"University of Houston Houston, TX",0.74
"University of Nevada--Las Vegas Las Vegas, NV",0.74


In [24]:
# Display the race-fraction DataFrame again before looking for missing rows.
college_ugds_

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,0.0333,0.9353,0.0055,0.0019,0.0024,0.0019,0.0000,0.0059,0.0138
University of Alabama at Birmingham,0.5922,0.2600,0.0283,0.0518,0.0022,0.0007,0.0368,0.0179,0.0100
Amridge University,0.2990,0.4192,0.0069,0.0034,0.0000,0.0000,0.0000,0.0000,0.2715
University of Alabama in Huntsville,0.6988,0.1255,0.0382,0.0376,0.0143,0.0002,0.0172,0.0332,0.0350
Alabama State University,0.0158,0.9208,0.0121,0.0019,0.0010,0.0006,0.0098,0.0243,0.0137
The University of Alabama,0.7825,0.1119,0.0348,0.0106,0.0038,0.0009,0.0261,0.0268,0.0026
Central Alabama Community College,0.7255,0.2613,0.0044,0.0025,0.0044,0.0000,0.0000,0.0000,0.0019
Athens State University,0.7823,0.1200,0.0191,0.0053,0.0157,0.0010,0.0174,0.0057,0.0334
Auburn University at Montgomery,0.5328,0.3376,0.0074,0.0221,0.0044,0.0016,0.0297,0.0397,0.0246
Auburn University,0.8507,0.0704,0.0248,0.0227,0.0074,0.0000,0.0000,0.0100,0.0140


In [25]:
# Select one school by its index label; every race column is NaN for it.
college_ugds_.loc['Excel Learning Center-San Antonio South']

UGDS_WHITE   NaN
UGDS_BLACK   NaN
UGDS_HISP    NaN
UGDS_ASIAN   NaN
UGDS_AIAN    NaN
UGDS_NHPI    NaN
UGDS_2MOR    NaN
UGDS_NRA     NaN
UGDS_UNKN    NaN
Name: Excel Learning Center-San Antonio South, dtype: float64

In [26]:
# Count the missing race values for each college and list the largest counts
# first. A count of 9 means all nine race columns are missing.
missing_per_college = college_ugds_.isnull().sum(axis='columns')
missing_per_college.sort_values(ascending=False).head()

INSTNM
Excel Learning Center-San Antonio South         9
Philadelphia College of Osteopathic Medicine    9
Assemblies of God Theological Seminary          9
Episcopal Divinity School                       9
Phillips Graduate Institute                     9
dtype: int64

In [27]:
# Use the dropna method to drop all rows that have all nine race percentages
# missing. Note that this rebinds college_ugds_ to the filtered frame.
college_ugds_ = college_ugds_.dropna(how='all')
# Then count the remaining missing values: there are none left in the dataset.
college_ugds_.isnull().sum()

UGDS_WHITE    0
UGDS_BLACK    0
UGDS_HISP     0
UGDS_ASIAN    0
UGDS_AIAN     0
UGDS_NHPI     0
UGDS_2MOR     0
UGDS_NRA      0
UGDS_UNKN     0
dtype: int64

In [28]:
# Having seen the colleges that are missing all their race columns, drop every
# row in which all nine race percentages are missing, then count the missing
# values that remain. This repeats the dropna from the previous cell, so it
# changes nothing the second time.
college_ugds_ = college_ugds_.dropna(axis='index', how='all')
college_ugds_.isnull().sum()

UGDS_WHITE    0
UGDS_BLACK    0
UGDS_HISP     0
UGDS_ASIAN    0
UGDS_AIAN     0
UGDS_NHPI     0
UGDS_2MOR     0
UGDS_NRA      0
UGDS_UNKN     0
dtype: int64

In [29]:
# With no missing values left in the dataset, the diversity metric can be
# calculated. Start with the greater-than-or-equal DataFrame method, ge, which
# converts each value to a boolean (True where the fraction is at least .15).
college_ugds_.ge(.15)

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Alabama A & M University,False,True,False,False,False,False,False,False,False
University of Alabama at Birmingham,True,True,False,False,False,False,False,False,False
Amridge University,True,True,False,False,False,False,False,False,True
University of Alabama in Huntsville,True,False,False,False,False,False,False,False,False
Alabama State University,False,True,False,False,False,False,False,False,False
The University of Alabama,True,False,False,False,False,False,False,False,False
Central Alabama Community College,True,True,False,False,False,False,False,False,False
Athens State University,True,False,False,False,False,False,False,False,False
Auburn University at Montgomery,True,True,False,False,False,False,False,False,False
Auburn University,True,False,False,False,False,False,False,False,False


In [30]:
# Summing the booleans across the columns counts the True values for each
# college. Notice that the result is a Series.
at_or_above_15 = college_ugds_.ge(.15)
diversity_metric = at_or_above_15.sum(axis='columns')
diversity_metric.head()

INSTNM
Alabama A & M University               1
University of Alabama at Birmingham    2
Amridge University                     3
University of Alabama in Huntsville    1
Alabama State University               1
dtype: int64

In [37]:
# To get an idea of the distribution, use the value_counts method on this
# Series. For example, 3042 schools have exactly one race category whose
# share reaches the 15% threshold.
diversity_metric.value_counts()


1    3042
2    2884
3     876
4      63
0       7
5       2
dtype: int64

In [34]:
# Only two schools have five race categories that each reach the 15% threshold.
diversity_metric.sort_values(ascending=False).head()

INSTNM
Regency Beauty Institute-Austin          5
Central Texas Beauty College-Temple      5
Sullivan and Cogliano Training Center    4
Ambria College of Nursing                4
Berkeley College-New York                4
dtype: int64

In [39]:
# It seems a little suspicious that schools can be that diverse, so look at
# the raw percentages of the top two schools. The .loc indexer selects rows
# by index label.
# It appears that several categories were aggregated into the "unknown" and
# "two or more races" columns. Regardless, both schools look quite diverse.
most_diverse = ['Regency Beauty Institute-Austin',
                'Central Texas Beauty College-Temple']
college_ugds_.loc[most_diverse]

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Regency Beauty Institute-Austin,0.1867,0.2133,0.16,0.0,0.0,0.0,0.1733,0.0,0.2667
Central Texas Beauty College-Temple,0.1616,0.2323,0.2626,0.0202,0.0,0.0,0.1717,0.0,0.1515


In [40]:
# Alternatively, find the least diverse schools by ordering them by their
# largest single race percentage.
top_share = college_ugds_.max(axis='columns')
top_share.sort_values(ascending=False).head(10)

INSTNM
Dewey University-Manati                               1.0
Yeshiva and Kollel Harbotzas Torah                    1.0
Mr Leon's School of Hair Design-Lewiston              1.0
Dewey University-Bayamon                              1.0
Shepherds Theological Seminary                        1.0
Yeshiva Gedolah Kesser Torah                          1.0
Monteclaro Escuela de Hoteleria y Artes Culinarias    1.0
Yeshiva Shaar Hatorah                                 1.0
Bais Medrash Elyon                                    1.0
Yeshiva of Nitra Rabbinical College                   1.0
dtype: float64

In [41]:
# Check whether any school has all nine race categories exceeding 1%:
# gt builds the boolean frame, all reduces each row, any reduces the result.
college_ugds_.gt(.01).all(axis='columns').any()

True

In [44]:
# Show the schools in which every one of the nine race categories exceeds 1%,
# using the row-wise boolean result as a mask.
college_ugds_[(college_ugds_ > .01).all(axis=1)]

Unnamed: 0_level_0,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN
INSTNM,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
John F. Kennedy University,0.3665,0.1554,0.259,0.0837,0.0159,0.012,0.0359,0.0319,0.0398
National Holistic Institute,0.4122,0.0933,0.1889,0.0689,0.0111,0.0278,0.1522,0.0267,0.0189
Santa Fe University of Art and Design,0.4529,0.0703,0.2765,0.0191,0.025,0.0179,0.0751,0.0501,0.0131
Eastern Oregon University,0.7611,0.0294,0.0624,0.0207,0.0254,0.0113,0.0133,0.015,0.0614
New Hope Christian College-Eugene,0.6111,0.037,0.0864,0.037,0.0123,0.0432,0.0926,0.0247,0.0556
Salt Lake Community College,0.6888,0.0248,0.1612,0.0405,0.0104,0.0128,0.0256,0.0132,0.0227
Northwest University,0.6827,0.0447,0.0853,0.0475,0.0124,0.0165,0.0447,0.02,0.0461
South Puget Sound Community College,0.6351,0.0322,0.085,0.0509,0.0125,0.0102,0.0926,0.0112,0.0706
Fashion Institute of Design & Merchandising-San Diego,0.3732,0.0352,0.3732,0.0775,0.0141,0.0282,0.0141,0.0352,0.0493
Northwest College of Art & Design,0.5851,0.0213,0.0957,0.0213,0.0426,0.0213,0.0851,0.0106,0.117
