In [None]:
import numpy as np
import matplotlib.pylab as plt
%matplotlib notebook

In [None]:
# Siena admissions/enrollment figures, supplied by Lee:
# https://docs.google.com/spreadsheets/d/1dKz5hnR74_6Vrq4yi8Fg40_syIIWOz9Ynw50noSGKIs/edit#gid=1618407295

'''
Ethnicity	Applicants	Admits	Enrolled
American Indian	86	30	5
Asian	3059	1353	163
Black	5738	1634	157
Hispanic	7239	2974	321
International	861	308	45
Multiracial	1209	589	96
Pacific Islander	3	3	3
Unknown	1667	891	19
White	26428	19245	2922
Total	46290	27027	3731
''';

# Only these four groups are tracked in the arrays below.  The remaining rows
# of the table (American Indian, International, Multiracial, Pacific Islander,
# Unknown) are NOT represented by any array entry.
names = ['Asian', 'Black', 'Hispanic', 'White']

# "Enrolled" column of the table, in the same order as `names`.
siena = np.array([163, 157, 321, 2922])

# "Total" row of the "Enrolled" column, i.e. every group, not just the four
# tracked ones, so the percentages below do not add up to 100.
sienapop = 3731

# Share of total enrollment (in percent) for each tracked group.
siena_pct = siena * 100 / sienapop


'''As of the 2010 census, New York State has a population of 19,378,102, including 
12,740,974 (65.7%) white, 
3,073,800 (15.9%) black, 
1,420,244 (7.3%) Asian, 
8,766 (0.0%) Pacific Islander, and 
1,441,563 (7.4%) of other races. 
585,849 (3.0%) has two or more races. 
Hispanics and Latinos of all races make up 3,416,922 (17.6%) of the state's population; 
non-Hispanic whites make up 58.3% of the state's population.'''
# Source of the quote above: https://en.wikipedia.org/wiki/Demographics_of_New_York

# Open question: how should this be parsed so that it is comparable to the
# Siena categories?
# Percentages taken from the quote, ordered Asian, Black, Hispanic, White.
# The Hispanic figure counts people "of all races", so it overlaps with the
# other three entries and the four values add up to more than 100.
nys_pct = np.array([7.3, 15.9, 17.6, 65.7])

# Total state population from the same quote.
nyspop = 19378102

# Head count per group, recovered from the percentages.
nys = (nys_pct / 100.) * nyspop

# Sanity check: combined head count with the (overlapping) Hispanic entry
# at index 2 taken back out.
print(np.sum(nys) - nys[2])


# Capital District figures (2014), from the Capital Region statistical report:
# http://capitalregionchamber.com/wp-content/uploads/2015/09/15-9-01-Capital-Region-Statistical-Report.pdf

# Head counts per group -- presumably in the same Asian, Black, Hispanic,
# White order used for the other arrays in this notebook (verify against the
# report).
cd = np.array([34316., 75624., 41735., 714292.])

# Population figure used as the denominator for the percentages.
total = 848601.

# Sanity check: combined head count leaving out the entry at index 2.
print(cd[[0, 1, 3]].sum())

# Share of `total` (in percent) for each entry of `cd`.
cd_pct = cd * 100 / total


In [None]:
# Compare each group's share at Siena (x axis) with its share in New York
# State (squares) and in the Capital District (circles).
plt.figure()

# Both series use the same large, half-transparent markers.
marker_kw = dict(markersize=20, alpha=0.50)
plt.plot(siena_pct, nys_pct, 's', label='NY state vs. Siena', **marker_kw)
plt.plot(siena_pct, cd_pct, 'o', label='Capital District vs. Siena', **marker_kw)

# Dashed diagonal: where a point sits if both shares are equal.
plt.plot([0, 100], [0, 100], '--', label="1-to-1")
plt.legend()
plt.xlabel('Siena (%)', fontsize=18)
plt.ylabel('Cap Dist/NY State (%)', fontsize=18)

# Hand-tuned text positions, one per entry of `names`.  They are offset from
# the Capital District points; the last label uses a fixed height of 75.
label_xy = [
    (siena_pct[0] - 15, cd_pct[0] - 5),
    (siena_pct[1] - 15, cd_pct[1] + 5),
    (siena_pct[2] + 5, cd_pct[2] + 5),
    (siena_pct[3] + 5, 75),
]
for (label_x, label_y), group in zip(label_xy, names):
    plt.text(label_x, label_y, group, fontsize=15)

plt.tight_layout()

plt.savefig("siena_comp_demos.png")

In [None]:
# One uniformly random (x, y) position in the unit square per enrolled
# student, grouped the same way as `siena`.  Within each group the x array is
# drawn before the y array.
point_sets = [(np.random.random(count), np.random.random(count)) for count in siena]

x = [xs for xs, _ in point_sets]
y = [ys for _, ys in point_sets]

# "Siena as is", colour-coded: every group gets its own colour and marker.
plt.figure()
markersize = 5
colors = ['r', 'orange', 'g', 'b']
alphas = [1, 1, 1, 0.4]   # only the last (largest) group is drawn translucent
msizes = [5] * 4
mtypes = ['v', '^', 's', '.']

# Bundle the per-group keyword arguments so the plotting loop stays short.
group_styles = [dict(markersize=m, alpha=a, color=c)
                for c, a, m in zip(colors, alphas, msizes)]

# The loop variable is named `mt` on purpose: it stays bound (to '.') once
# the loop has finished.
for xpt, ypt, mt, style in zip(x, y, mtypes, group_styles):
    plt.plot(xpt, ypt, mt, **style)

plt.axis('off')
plt.text(0.8, 0.9, 'Siena', fontsize=24, bbox=dict(facecolor='white'))
# Margins are set by hand (not via tight_layout) so the dots fill the figure.
plt.subplots_adjust(bottom=0.01, top=0.99, left=0.01, right=0.99)

plt.savefig('siena_asis_color.png')


# "Siena as is", uniform styling: the same points as the colour-coded figure,
# but every group is drawn with an identical blue, translucent dot.
plt.figure()
markersize = 5
colors = ['b','b','b','b']
alphas = [0.4,0.4,0.4,0.4]
msizes = [markersize]*4
mtypes = ['.','.','.','.']

# `mtypes` must be part of the zip: the marker used to come from a stale `mt`
# left behind by an earlier loop, so the list above was never actually read
# and this block failed with a NameError when run on its own.
for xpt,ypt,c,a,m,mt in zip(x,y,colors,alphas,msizes,mtypes):

    plt.plot(xpt,ypt,mt,markersize=m,alpha=a,color=c)

plt.axis('off')
plt.text(0.8,0.9,'Siena',fontsize=24,bbox={'facecolor':'white'})
# Margins are set by hand (not via tight_layout) so the dots fill the figure.
plt.subplots_adjust(left=0.01, right=0.99, top=0.99, bottom=0.01)

plt.savefig('siena_asis_same.png')

In [None]:
# Random (x, y) positions for a student body of Siena's size that has New York
# State's demographic mix: one x array and one y array per entry of `nys`.
x = []
y = []

# Factor that shrinks a state head count down to Siena's enrollment.  The
# explicit float() keeps this a true division even under Python 2.
scale = sienapop / float(nyspop)

for s in nys:

    s = s * scale
    print(s)

    # np.random.random only accepts an integer size, and the scaled head count
    # is fractional (e.g. 272.36), so round it to the nearest whole student.
    n_points = int(round(s))

    x.append(np.random.random(n_points))
    y.append(np.random.random(n_points))

    
# "Siena as NYS", colour-coded: every group gets its own colour and marker.
plt.figure()
markersize = 5
colors = ['r', 'orange', 'g', 'b']
alphas = [1, 1, 1, 0.4]   # only the last (largest) group is drawn translucent
msizes = [5] * 4
mtypes = ['v', '^', 's', '.']

# Bundle the per-group keyword arguments so the plotting loop stays short.
group_styles = [dict(markersize=m, alpha=a, color=c)
                for c, a, m in zip(colors, alphas, msizes)]

for xpt, ypt, marker, style in zip(x, y, mtypes, group_styles):
    plt.plot(xpt, ypt, marker, **style)

plt.axis('off')
plt.text(0.6, 0.9, 'Siena as NYS', fontsize=24, bbox=dict(facecolor='white'))

# Margins are set by hand (not via tight_layout) so the dots fill the figure.
plt.subplots_adjust(bottom=0.01, top=0.99, left=0.01, right=0.99)

plt.savefig('siena_nys_color.png')


# "Siena as NYS", uniform styling: every group is drawn with an identical
# blue, translucent dot.
plt.figure()
markersize = 5
colors = ['b'] * 4
alphas = [0.4] * 4
msizes = [5] * 4

# Bundle the per-group keyword arguments so the plotting loop stays short.
group_styles = [dict(markersize=m, alpha=a, color=c)
                for c, a, m in zip(colors, alphas, msizes)]

for xpt, ypt, style in zip(x, y, group_styles):
    plt.plot(xpt, ypt, '.', **style)

plt.axis('off')
plt.text(0.6, 0.9, 'Siena as NYS', fontsize=24, bbox=dict(facecolor='white'))

# Margins are set by hand (not via tight_layout) so the dots fill the figure.
plt.subplots_adjust(bottom=0.01, top=0.99, left=0.01, right=0.99)

plt.savefig('siena_nys_same.png')