## Transform

Transform the data (extracted as 51 individual CSV files, one per state plus the District of Columbia) into one large DataFrame, then clean it up so that the rows and columns are unique.

In [1]:
import pandas as pd

In [2]:
# Load the Alabama extract as a first example of the per-state CSV layout
alabama_csv_path = "../Data/States/Alabama.csv"
alabama = pd.read_csv(alabama_csv_path)

In [3]:
# Use the "Age (AGEP)" label column as the row index, then preview the first rows
alabama = alabama.set_index(keys="Age (AGEP)")
alabama.head(n=5)

Unnamed: 0_level_0,Total,Alabama/AL,Alaska/AK,Arizona/AZ,Arkansas/AR,California/CA,Colorado/CO,Connecticut/CT,Delaware/DE,District of Columbia/DC,...,"South America, Not Specified",Egypt,Ethiopia (2017 or later),Kenya (2017 or later),Nigeria,"Western Africa, Not Specified","Northern Africa or Other Africa, Not Specified","Eastern Africa, Not Specified",Australia,"Other US Island Areas, Oceania, Not Specified, or At Sea"
Age (AGEP),Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
-> Total,319852,253611,429,868,859,1674,983,393,64,167,...,162,36,0,12,105,0,69,103,109,128
-> Total ->,319852,253611,429,868,859,1674,983,393,64,167,...,162,36,0,12,105,0,69,103,109,128
Total 12th grade - no diploma,7237,5807,0,4,0,63,9,99,0,0,...,0,0,0,0,0,0,0,0,0,0
25 years Total 12th grade - no diploma,260,191,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
26 years Total 12th grade - no diploma,336,287,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [4]:
# Swap the axes so that each origin becomes a row and each age/education label a column
alabama_df = alabama.transpose()

In [5]:
# Tag every row with the destination state: after the transpose each row is an origin,
# so the new "To_State" column records which state that origin's movers went to.
alabama_df = alabama_df.assign(To_State="Alabama")


In [6]:
# The full reshaping for a single state, written as one chain:
# read -> index by the label column -> transpose -> tag with the destination state
alabama = (
    pd.read_csv("../Data/States/Alabama.csv")
    .set_index("Age (AGEP)")
    .T
    .assign(To_State="Alabama")
)
alabama.head(n=5)

Age (AGEP),-> Total,-> Total ->,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,31 years Total 12th grade - no diploma,...,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree,To_State
Total,319852,319852,7237,260,336,227,132,275,265,339,...,32,2,2,31,0,4,8,10,60,Alabama
Alabama/AL,253611,253611,5807,191,287,227,125,163,178,231,...,13,2,0,31,0,4,8,0,45,Alabama
Alaska/AK,429,429,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
Arizona/AZ,868,868,4,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
Arkansas/AR,859,859,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama


In [7]:
# Show every column label of the reshaped frame as a plain Python list
alabama.columns.tolist()

[' -> Total',
 ' -> Total ->',
 'Total 12th grade - no diploma',
 '25 years Total 12th grade - no diploma',
 '26 years Total 12th grade - no diploma',
 '27 years Total 12th grade - no diploma',
 '28 years Total 12th grade - no diploma',
 '29 years Total 12th grade - no diploma',
 '30 years Total 12th grade - no diploma',
 '31 years Total 12th grade - no diploma',
 '32 years Total 12th grade - no diploma',
 '33 years Total 12th grade - no diploma',
 '34 years Total 12th grade - no diploma',
 '35 years Total 12th grade - no diploma',
 '36 years Total 12th grade - no diploma',
 '37 years Total 12th grade - no diploma',
 '38 years Total 12th grade - no diploma',
 '39 years Total 12th grade - no diploma',
 '40 years Total 12th grade - no diploma',
 '41 years Total 12th grade - no diploma',
 '42 years Total 12th grade - no diploma',
 '43 years Total 12th grade - no diploma',
 '44 years Total 12th grade - no diploma',
 '45 years Total 12th grade - no diploma',
 '46 years Total 12th grade - no

In [8]:
# Destination states with a CSV in the Data folder (one file per entry)
states_list = [
    "Alabama", "Alaska", "Arizona", "Arkansas", "California", "Colorado", "Connecticut",
    "Delaware", "District of Columbia", "Florida", "Georgia", "Hawaii", "Idaho", "Illinois",
    "Indiana", "Iowa", "Kansas", "Kentucky", "Louisiana", "Maine", "Maryland", "Massachusetts",
    "Michigan", "Minnesota", "Mississippi", "Missouri", "Montana", "Nebraska", "Nevada",
    "New Hampshire", "New Jersey", "New Mexico", "New York", "North Carolina", "North Dakota",
    "Ohio", "Oklahoma", "Oregon", "Pennsylvania", "Rhode Island", "South Carolina",
    "South Dakota", "Tennessee", "Texas", "Utah", "Vermont", "Virginia", "Washington",
    "West Virginia", "Wisconsin", "Wyoming",
]

# Maps each destination state name to its reshaped DataFrame
dict_state = {}

# Reshape every state's CSV the same way: rename the label column to "Origin", index by it,
# transpose so origins become rows, and tag the rows with the destination state.
for state in states_list:
    df = (
        pd.read_csv(f'../Data/States/{state}.csv')
        .rename(columns={"Age (AGEP)": "Origin"})
        .set_index("Origin")
        .T
    )
    df["To_State"] = state
    dict_state[state] = df


In [9]:
# Any state's reshaped DataFrame can be looked up by using the state name as the dictionary key
dict_state["California"]

Origin,-> Total,-> Total ->,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,31 years Total 12th grade - no diploma,...,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree,To_State
Total,2681950,2681950,66579,2445,2779,2252,2453,2790,2382,2088,...,336,392,619,460,364,547,286,433,201,California
Alabama/AL,2174,2174,41,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,California
Alaska/AK,2083,2083,16,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,California
Arizona/AZ,17511,17511,278,1,0,0,32,28,0,0,...,0,0,0,12,0,0,0,0,0,California
Arkansas/AR,1882,1882,69,0,0,0,0,31,0,0,...,0,0,0,0,0,0,0,0,0,California
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
"Western Africa, Not Specified",339,339,24,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,California
"Northern Africa or Other Africa, Not Specified",1068,1068,25,0,0,0,0,0,11,0,...,0,0,0,0,0,0,0,0,0,California
"Eastern Africa, Not Specified",561,561,107,0,0,66,0,41,0,0,...,0,0,0,0,0,0,0,0,0,California
Australia,3401,3401,33,0,0,0,0,0,0,12,...,0,0,0,0,0,0,0,0,0,California


In [10]:
# Stack all per-state frames into one frame, keeping the origin labels as the index
df = pd.concat(list(dict_state.values()))

In [11]:
# Preview the first rows of the combined frame
df.head(n=5)


Origin,-> Total,-> Total ->,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,31 years Total 12th grade - no diploma,...,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree,To_State
Total,319852,319852,7237,260,336,227,132,275,265,339,...,32,2,2,31,0,4,8,10,60,Alabama
Alabama/AL,253611,253611,5807,191,287,227,125,163,178,231,...,13,2,0,31,0,4,8,0,45,Alabama
Alaska/AK,429,429,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
Arizona/AZ,868,868,4,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
Arkansas/AR,859,859,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama


## Load

Create a SQLAlchemy engine and load the combined all-states DataFrame (`df`) into the PostgreSQL database.

In [12]:
# Dependencies
# NOTE(review): pw and port are imported from both login and config. The later import
# (config) rebinds both names, so the values from login are never used — confirm which
# module is the intended source of the credentials.
from login import port, pw
from sqlalchemy import create_engine
from sqlalchemy.ext.automap import automap_base
from config import user, pw, port

In [13]:
# Build the PostgreSQL connection URL from the imported credentials and create the engine
db_url = f'postgresql://{user}:{pw}@localhost:{port}/interstate_migration_db'
engine = create_engine(db_url)

# Open a connection to the PostgreSQL server
conn = engine.connect()

In [14]:
# Reflect the existing database schema into automap classes
base = automap_base()
base.prepare(engine, reflect=True)
# List the names of the classes automap generated from the reflected tables.
# NOTE(review): automap presumably only maps tables that have a primary key, which would
# explain an empty list here even when tables exist — confirm against the SQLAlchemy docs.
base.classes.keys()

[]

In [15]:
# Write the combined all-states frame (df) to the "states" table, replacing the table if it
# already exists; the frame's index is written as a column as well
df.to_sql("states", engine, if_exists="replace", index=True)

In [16]:
# Confirm table names.
# Engine.table_names() is deprecated and no longer exists in SQLAlchemy 2.0; the inspector
# API returns the same list of table names and works across SQLAlchemy versions.
from sqlalchemy import inspect

inspect(engine).get_table_names()

['states_clean', 'states']

In [17]:
# Read every row of the "states" table back into a DataFrame and display it
states_query = "SELECT * FROM states"
df2 = pd.read_sql_query(states_query, con=engine)
df2

Unnamed: 0,index,-> Total,-> Total ->,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,...,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree,To_State
0,Total,319852,319852,7237,260,336,227,132,275,265,...,32,2,2,31,0,4,8,10,60,Alabama
1,Alabama/AL,253611,253611,5807,191,287,227,125,163,178,...,13,2,0,31,0,4,8,0,45,Alabama
2,Alaska/AK,429,429,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
3,Arizona/AZ,868,868,4,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
4,Arkansas/AR,859,859,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Alabama
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5554,"Western Africa, Not Specified",0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Wyoming
5555,"Northern Africa or Other Africa, Not Specified",0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Wyoming
5556,"Eastern Africa, Not Specified",54,54,54,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Wyoming
5557,Australia,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Wyoming


In [18]:
# The origin labels came back from SQL in a column called "index"; give it a meaningful name
column_renames = {"index": "Origin"}
df2 = df2.rename(columns=column_renames)

In [19]:
# Index the table by the (To_State, Origin) pair
df2 = df2.set_index(["To_State", "Origin"])

In [20]:
# The first two columns of the combined frame appear to carry the same totals (see the
# previews above): keep the first under the name "Total" and discard the second.
total_col, duplicate_total_col = df.columns[0], df.columns[1]
df2 = df2.rename(columns={total_col: "Total"}).drop(columns=[duplicate_total_col])
df2

Unnamed: 0_level_0,Unnamed: 1_level_0,Total,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,31 years Total 12th grade - no diploma,32 years Total 12th grade - no diploma,...,66 years Total Doctorate degree,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree
To_State,Origin,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1
Alabama,Total,319852,7237,260,336,227,132,275,265,339,263,...,44,32,2,2,31,0,4,8,10,60
Alabama,Alabama/AL,253611,5807,191,287,227,125,163,178,231,218,...,31,13,2,0,31,0,4,8,0,45
Alabama,Alaska/AK,429,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
Alabama,Arizona/AZ,868,4,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
Alabama,Arkansas/AR,859,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Wyoming,"Western Africa, Not Specified",0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
Wyoming,"Northern Africa or Other Africa, Not Specified",0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
Wyoming,"Eastern Africa, Not Specified",54,54,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
Wyoming,Australia,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [21]:
# Persist the cleaned frame as the "states_clean" table, replacing it if it already exists.
# The write goes through the engine, like every other read and write in this notebook,
# so it does not depend on the state of the long-lived `conn` connection.
# index=True stores the To_State / Origin index levels as regular columns.
df2.to_sql(name="states_clean", con=engine, if_exists="replace", index=True)

In [22]:
# Read every row of the "states_clean" table back into a DataFrame and display it
states_clean_query = "SELECT * FROM states_clean"
df2 = pd.read_sql_query(states_clean_query, con=engine)
df2

Unnamed: 0,To_State,Origin,Total,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,...,66 years Total Doctorate degree,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree
0,Alabama,Total,319852,7237,260,336,227,132,275,265,...,44,32,2,2,31,0,4,8,10,60
1,Alabama,Alabama/AL,253611,5807,191,287,227,125,163,178,...,31,13,2,0,31,0,4,8,0,45
2,Alabama,Alaska/AK,429,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
3,Alabama,Arizona/AZ,868,4,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
4,Alabama,Arkansas/AR,859,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5554,Wyoming,"Western Africa, Not Specified",0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5555,Wyoming,"Northern Africa or Other Africa, Not Specified",0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5556,Wyoming,"Eastern Africa, Not Specified",54,54,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5557,Wyoming,Australia,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [23]:
all_states = ['Alabama', 'Alaska', 'Arizona', 'Arkansas', 'California',
       'Colorado', 'Connecticut', 'Delaware', 'District of Columbia',
       'Florida', 'Georgia', 'Hawaii', 'Idaho', 'Illinois', 'Indiana',
       'Iowa', 'Kansas', 'Kentucky', 'Louisiana', 'Maine', 'Maryland',
       'Massachusetts', 'Michigan', 'Minnesota', 'Mississippi',
       'Missouri', 'Montana', 'Nebraska', 'Nevada', 'New Hampshire',
       'New Jersey', 'New Mexico', 'New York', 'North Carolina',
       'North Dakota', 'Ohio', 'Oklahoma', 'Oregon', 'Pennsylvania',
       'Rhode Island', 'South Carolina', 'South Dakota', 'Tennessee',
       'Texas', 'Utah', 'Vermont', 'Virginia', 'Washington',
       'West Virginia', 'Wisconsin', 'Wyoming']

# State origins are labelled like "Alabama/AL"; the text before the slash is the state name
# in the same spelling that To_State uses.
origin_state = df2["Origin"].str.split("/", n=1).str[0].str.strip()

# Select each state's origin rows and relabel Origin with the plain state name.
# The comparison must be exact: a substring test for "Virginia" also matches
# "West Virginia/WV", which would relabel West Virginia rows as Virginia and count them twice.
all_df = []
for x in all_states:
    df3 = df2[origin_state == x].copy()
    df3["Origin"] = x
    all_df.append(df3)

In [37]:
# Stack the per-origin frames row-wise into a single state-to-state table
df_final = pd.concat(all_df, axis=0)

In [38]:
# Display the result: Origin now holds plain state names in the same spelling as To_State
df_final

Unnamed: 0,To_State,Origin,Total,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,...,66 years Total Doctorate degree,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree
1,Alabama,Alabama,253611,5807,191,287,227,125,163,178,...,31,13,2,0,31,0,4,8,0,45
110,Alaska,Alabama,227,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
219,Arizona,Alabama,661,9,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
328,Arkansas,Alabama,431,26,3,0,0,23,0,0,...,0,0,0,0,0,0,0,0,0,0
437,California,Alabama,2174,41,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5065,Virginia,Wyoming,58,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5174,Washington,Wyoming,674,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5283,West Virginia,Wyoming,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5392,Wisconsin,Wyoming,353,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [39]:
# NOTE(review): dead code — a commented-out copy of the body of the per-state loading loop
# earlier in this notebook. Nothing executes here; this cell can be deleted.
#     df = pd.read_csv(f'../Data/States/{state}.csv').rename(columns = {"Age (AGEP)":"Origin"}).set_index("Origin").T
#     df["To_State"] = f'{state}'
#     dict_state[state] = df

In [40]:
# For every state, collect the rows where that state is the origin and the destination is a
# different state, i.e. leave out the rows whose origin and destination are the same state.
no_dupes = {}
origin_is_state = df_final["Origin"].isin(all_states)
for x in df_final["To_State"].unique():
    leaves_x = origin_is_state & (df_final["To_State"] != x) & (df_final["Origin"] == x)
    df_t = df_final[leaves_x]
    no_dupes[x] = df_t
    
    

In [41]:
# Rows with California as the origin and any other state as the destination
no_dupes["California"]

Unnamed: 0,To_State,Origin,Total,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,...,66 years Total Doctorate degree,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree
5,Alabama,California,1674,63,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
114,Alaska,California,2075,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
223,Arizona,California,35420,714,21,15,49,0,53,0,...,22,59,52,21,0,12,0,0,9,0
332,Arkansas,California,2511,51,0,0,34,0,17,0,...,0,0,0,6,0,0,0,0,0,0
550,Colorado,California,15176,185,60,0,9,0,24,0,...,24,0,0,0,0,0,0,0,0,17
659,Connecticut,California,2275,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
768,Delaware,California,223,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
877,District of Columbia,California,1938,0,0,0,0,0,0,0,...,0,0,0,0,43,0,0,0,24,0
986,Florida,California,16777,316,0,0,29,0,16,76,...,0,0,0,0,10,10,0,0,32,8
1095,Georgia,California,9704,179,0,0,0,0,17,0,...,0,11,22,0,0,0,0,0,0,0


In [42]:
# Stack the per-origin frames into one table, keeping the original row labels
no_dupes_df = pd.concat(list(no_dupes.values()))

In [43]:
# Display the combined table of rows whose origin state differs from the destination state
no_dupes_df

Unnamed: 0,To_State,Origin,Total,Total 12th grade - no diploma,25 years Total 12th grade - no diploma,26 years Total 12th grade - no diploma,27 years Total 12th grade - no diploma,28 years Total 12th grade - no diploma,29 years Total 12th grade - no diploma,30 years Total 12th grade - no diploma,...,66 years Total Doctorate degree,67 years Total Doctorate degree,68 years Total Doctorate degree,69 years Total Doctorate degree,70 years Total Doctorate degree,71 years Total Doctorate degree,72 years Total Doctorate degree,73 years Total Doctorate degree,74 years Total Doctorate degree,75 years Total Doctorate degree
110,Alaska,Alabama,227,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
219,Arizona,Alabama,661,9,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
328,Arkansas,Alabama,431,26,3,0,0,23,0,0,...,0,0,0,0,0,0,0,0,0,0
437,California,Alabama,2174,41,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
546,Colorado,Alabama,1463,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4956,Vermont,Wyoming,9,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5065,Virginia,Wyoming,58,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5174,Washington,Wyoming,674,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
5283,West Virginia,Wyoming,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [44]:
# Spot check: sum the Total column over all rows whose origin is Wyoming and whose
# destination is another state.
# Look the frame up by key rather than reusing the loop variable df_t, which only holds the
# Wyoming rows if Wyoming happened to be the last state processed by the loop.
wyoming_df = no_dupes["Wyoming"]
wyoming_df['Total'].sum()

14696