In [1]:
import pandas as pd
import numpy as np
import glob
import os
import matplotlib.pyplot as plt
import completions_module as cmodule

This notebook contains various tables for `Physical Sciences` degrees (2009-2019).

- Table 1: Bachelors / Hispanic + Latinx (total sum for year range)
- Table 2: Bachelors / Hispanic + Latinx (annual mean for year range)
- Table 3: Bachelors / Grand total (total sum for year range)
- Table 4: Bachelors / Grand total (annual mean for year range)

- Table 5: Masters / Hispanic + Latinx (total sum for year range)
- Table 6: Masters / Hispanic + Latinx (annual mean for year range)
- Table 7: Masters / Grand total (total sum for year range)
- Table 8: Masters / Grand total (annual mean for year range)

- Table 9: Doctorate / Hispanic + Latinx (total sum for year range)
- Table 10: Doctorate / Hispanic + Latinx (annual mean for year range)
- Table 11: Doctorate / Grand total (total sum for year range)
- Table 12: Doctorate / Grand total (annual mean for year range)


_Author: Maria J. Molina (molina@ucar.edu)_

In [2]:
# Collect every completions CSV under ../data and keep the paths in sorted
# (lexicographic) order so downstream cells see a stable file sequence.
all_files = sorted(glob.glob("../data/completions_*.csv"))

### Top 30 US institutions: Hispanic/Latinx bachelor's degree recipients in the Physical Sciences (2009-2019)

In [3]:
# Table 1: bachelor's / Hispanic or Latino, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.bs_degrees(df)              # bachelor's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .sum()                         # TOTAL SUM (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
Florida International University               876
The University of Texas at Austin              510
The University of Texas at El Paso             365
Texas A & M University-College Station         356
University of California-San Diego             341
University of California-Irvine                323
University of Houston                          302
University of California-Berkeley              260
University of California-Los Angeles           249
University of Arizona                          238
University of California-Davis                 209
United States Naval Academy                    191
San Diego State University                     190
University of Washington-Seattle Campus        189
University of South Florida-Main Campus        180
University of Illinois at Urbana-Champaign     179
Florida State University                       175
Texas A & M University-Corpus Christi          155
Northern Arizona University                    153
Pennsylvania S

In [4]:
# Table 2: bachelor's / Hispanic or Latino, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.bs_degrees(df)              # bachelor's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years. The saved outputs suggest some institutions have more than one
# row per year (e.g. Florida International University: 876 total / 46.105263
# mean = 19 rows for an 11-year range), so this is a per-row mean and can
# understate a true per-year mean — confirm the intended definition.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .mean()                        # ANNUAL MEAN (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
The University of Texas at Austin                46.363636
Florida International University                 46.105263
University of Houston                            27.454545
Texas A & M University-College Station           18.736842
The University of Texas at El Paso               18.250000
University of California-San Diego               15.500000
University of California-Irvine                  14.681818
United States Naval Academy                      13.642857
Pennsylvania State University-Main Campus        13.636364
Texas A & M University-Corpus Christi            12.916667
University of South Florida-Main Campus          12.000000
University of California-Los Angeles             11.857143
University of California-Berkeley                11.818182
Arizona State University-Tempe                   11.461538
CUNY Graduate School and University Center       11.375000
University of Arizona                            10.818182
Rutgers University-New Brunswick       

### Top 30 US institutions: Grand total bachelor's degree recipients in the Physical Sciences (2009-2019)

In [6]:
# Table 3: bachelor's / grand total, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.bs_degrees(df)              # bachelor's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Grand total']
    .sum()                         # TOTAL SUM (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
Pennsylvania State University-Main Campus              3827
University of Washington-Seattle Campus                3590
University of California-Berkeley                      3337
University of California-San Diego                     3143
The University of Texas at Austin                      2848
University of Illinois at Urbana-Champaign             2648
University of North Carolina at Chapel Hill            2398
University of Minnesota-Twin Cities                    2358
University of California-Irvine                        2174
Texas A & M University-College Station                 2165
University of Wisconsin-Madison                        1887
University of California-Los Angeles                   1825
University of Virginia-Main Campus                     1749
University of Arizona                                  1727
University of California-Davis                         1672
United States Naval Academy                            1641
University of Maryland-

In [8]:
# Table 4: bachelor's / grand total, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.bs_degrees(df)              # bachelor's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years. The saved outputs suggest some institutions have more than one
# row per year (e.g. University of Washington-Seattle Campus: 3590 total /
# 163.181818 mean = 22 rows for an 11-year range), so this is a per-row mean
# and can understate a true per-year mean — confirm the intended definition.
(
    df.groupby('institution name')['Grand total']
    .mean()                        # ANNUAL MEAN (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
Pennsylvania State University-Main Campus      347.909091
The University of Texas at Austin              258.909091
University of Washington-Seattle Campus        163.181818
University of California-Berkeley              151.681818
University of California-San Diego             142.863636
Michigan State University                      140.818182
University of Houston                          128.454545
Rutgers University-New Brunswick               125.454545
University of Illinois at Urbana-Champaign     120.363636
United States Naval Academy                    117.214286
University of Utah                             115.846154
Texas A & M University-College Station         113.947368
University of North Carolina at Chapel Hill    109.000000
University of Minnesota-Twin Cities            107.181818
Mississippi State University                    99.363636
University of California-Irvine                 98.818182
University of Oklahoma-Norman Campus            98.3076

### Top 30 US institutions: Hispanic/Latinx master's degree recipients in the Physical Sciences (2009-2019)

In [13]:
# Table 5: master's / Hispanic or Latino, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.ms_degrees(df)              # master's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .sum()                         # TOTAL SUM (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-San Diego             86
The University of Texas at El Paso             81
University of Arizona                          70
Johns Hopkins University                       64
University of California-Los Angeles           63
Texas A & M University-College Station         62
CUNY Graduate School and University Center     58
Stanford University                            57
Florida International University               57
University of Houston                          54
University of Michigan-Ann Arbor               54
University of California-Berkeley              42
Pennsylvania State University-Main Campus      40
University of Washington-Seattle Campus        37
Florida State University                       36
The University of Texas at Austin              36
Columbia University in the City of New York    34
University of Wisconsin-Madison                34
University of California-Irvine                33
San Diego State University       

In [14]:
# Table 6: master's / Hispanic or Latino, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.ms_degrees(df)              # master's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years. The saved outputs suggest the row count per institution is not
# always the 11 years of the range (e.g. CUNY Graduate School and University
# Center: 58 total / 5.8 mean = 10 rows), so this equals a per-year mean only
# when an institution has exactly one row per year — confirm the intent.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .mean()                        # annual mean (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-San Diego             7.818182
The University of Texas at El Paso             7.363636
University of Arizona                          6.363636
Johns Hopkins University                       5.818182
CUNY Graduate School and University Center     5.800000
University of California-Los Angeles           5.727273
Texas A & M University-College Station         5.636364
Florida International University               5.181818
Stanford University                            5.181818
University of Michigan-Ann Arbor               4.909091
University of Houston                          4.909091
University of California-Berkeley              3.818182
Pennsylvania State University-Main Campus      3.636364
Florida State University                       3.272727
The University of Texas at Austin              3.272727
University of Wisconsin-Madison                3.090909
Columbia University in the City of New York    3.090909
University of California-Irvine

### Top 30 US institutions: Grand total master's degree recipients in the Physical Sciences (2009-2019)

In [11]:
# Table 7: master's / grand total, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.ms_degrees(df)              # master's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Grand total']
    .sum()                         # TOTAL SUM (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
Johns Hopkins University                       1361
University of California-San Diego             1109
University of Arizona                          1065
Mississippi State University                   1061
University of Washington-Seattle Campus         991
Columbia University in the City of New York     899
University of Michigan-Ann Arbor                885
University of California-Los Angeles            807
University of Houston                           777
University of California-Berkeley               770
University of Chicago                           763
Texas A & M University-College Station          741
Cornell University                              733
University of Wisconsin-Madison                 733
Florida State University                        716
University of Oklahoma-Norman Campus            704
Princeton University                            684
Yale University                                 682
Rice University                                

In [12]:
# Table 8: master's / grand total, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.ms_degrees(df)              # master's-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years. The saved outputs suggest some institutions have more rows than
# the 11 years of the range (e.g. University of Washington-Seattle Campus:
# 991 total / 70.785714 mean = 14 rows), so this is a per-row mean and can
# understate a true per-year mean — confirm the intended definition.
(
    df.groupby('institution name')['Grand total']
    .mean()                        # annual mean (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
Johns Hopkins University                       123.727273
University of California-San Diego             100.818182
University of Arizona                           96.818182
Mississippi State University                    96.454545
Columbia University in the City of New York     81.727273
University of Michigan-Ann Arbor                80.454545
University of California-Los Angeles            73.363636
University of Washington-Seattle Campus         70.785714
University of Houston                           70.636364
University of California-Berkeley               70.000000
University of Chicago                           69.363636
Texas A & M University-College Station          67.363636
Cornell University                              66.636364
University of Wisconsin-Madison                 66.636364
Florida State University                        65.090909
University of Oklahoma-Norman Campus            64.000000
Princeton University                            62.1818

### Top 30 US institutions: Hispanic/Latinx doctoral degree recipients in the Physical Sciences (2009-2019)

In [15]:
# Table 9: doctorate / Hispanic or Latino, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.phd_degrees(df)             # doctorate-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .sum()                         # total sum (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-Berkeley              63
University of California-San Diego             49
University of California-Los Angeles           46
Florida International University               46
CUNY Graduate School and University Center     44
The University of Texas at Austin              43
Texas A & M University-College Station         39
Massachusetts Institute of Technology          37
Stanford University                            36
Pennsylvania State University-Main Campus      36
University of California-Irvine                34
University of California-Davis                 33
University of Michigan-Ann Arbor               32
Purdue University-Main Campus                  28
University of Arizona                          28
University of South Florida-Main Campus        26
California Institute of Technology             25
Columbia University in the City of New York    25
Rice University                                24
University of Wisconsin-Madison  

In [16]:
# Table 10: doctorate / Hispanic or Latino, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.phd_degrees(df)             # doctorate-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years; it equals a per-year mean only when an institution has exactly
# one row per year — TODO confirm that holds for the doctorate subset.
(
    df.groupby('institution name')['Hispanic or Latino total']
    .mean()                        # annual mean (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-Berkeley              5.727273
University of California-San Diego             4.454545
Florida International University               4.181818
University of California-Los Angeles           4.181818
CUNY Graduate School and University Center     4.000000
The University of Texas at Austin              3.909091
Texas A & M University-College Station         3.545455
Massachusetts Institute of Technology          3.363636
Pennsylvania State University-Main Campus      3.272727
Stanford University                            3.272727
University of California-Irvine                3.090909
University of California-Davis                 3.000000
University of Michigan-Ann Arbor               2.909091
University of Arizona                          2.545455
Purdue University-Main Campus                  2.545455
University of South Florida-Main Campus        2.363636
California Institute of Technology             2.272727
Columbia University in the City

### Top 30 US institutions: Grand total doctoral degree recipients in the Physical Sciences (2009-2019)

In [9]:
# Table 11: doctorate / grand total, total sum per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.phd_degrees(df)             # doctorate-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: only this one column is summed, and
# unrelated (possibly non-numeric) columns can no longer affect the aggregation.
(
    df.groupby('institution name')['Grand total']
    .sum()                         # TOTAL SUM (2009-2019)
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-Berkeley              1390
Stanford University                            1178
Massachusetts Institute of Technology          1097
University of Michigan-Ann Arbor               1064
University of Illinois at Urbana-Champaign     1042
The University of Texas at Austin               996
University of Wisconsin-Madison                 978
University of California-San Diego              942
Purdue University-Main Campus                   930
University of Arizona                           912
Harvard University                              907
Texas A & M University-College Station          881
Pennsylvania State University-Main Campus       868
University of Washington-Seattle Campus         850
California Institute of Technology              807
University of California-Los Angeles            785
University of Colorado Boulder                  783
Ohio State University-Main Campus               778
University of Maryland-College Park            

In [10]:
# Table 12: doctorate / grand total, mean per institution.
# `df` is rebuilt from the raw file list here, so the cell does not depend on
# whatever filter a previous cell last applied.
df = cmodule.open_and_concat(all_files)  # presumably reads and concatenates the CSVs — see completions_module
df = cmodule.phd_degrees(df)             # doctorate-level subset, per the section heading
df = cmodule.physical_sciences(df)       # Physical Sciences subset, per the section heading
# Select the column *before* aggregating: with pandas >= 2.0,
# `groupby(...).mean()` on the whole frame raises TypeError if any remaining
# column is non-numeric, and averaging every column is wasted work anyway.
#
# NOTE(review): `.mean()` averages over the ROWS of each institution group, not
# over years; it equals a per-year mean only when an institution has exactly
# one row per year — TODO confirm that holds for the doctorate subset.
(
    df.groupby('institution name')['Grand total']
    .mean()                        # annual mean (2009-2019) — see note above
    .sort_values(ascending=False)
    .head(30)                      # top 30 institutions
)

institution name
University of California-Berkeley              126.363636
Stanford University                            107.090909
Massachusetts Institute of Technology           99.727273
University of Michigan-Ann Arbor                96.727273
University of Illinois at Urbana-Champaign      94.727273
The University of Texas at Austin               90.545455
University of Wisconsin-Madison                 88.909091
University of California-San Diego              85.636364
Purdue University-Main Campus                   84.545455
University of Arizona                           82.909091
Harvard University                              82.454545
Texas A & M University-College Station          80.090909
Pennsylvania State University-Main Campus       78.909091
California Institute of Technology              73.363636
University of California-Los Angeles            71.363636
Ohio State University-Main Campus               70.727273
University of Maryland-College Park             68.2727