In [1]:
%matplotlib notebook

import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import scipy.stats as st

# Load the first consumption report and give its seven columns readable names.
# Assigning the list requires the CSV to have exactly seven columns.
consumption1_columns = [
    'State',
    'Total Personal Consumption Expenditures 2019',
    'Housing/Util.',
    'Healthcare',
    'Off-premises Food/Bev',
    'Gasoline/Energy',
    'All other Personal Consumptions',
]

# Positional row labels removed from the raw file.
# NOTE(review): presumably header, regional-subtotal and footnote rows rather
# than states -- confirm against the CSV.
consumption1_rows_to_drop = [0, 1, 2, 3, 10, 17, 23, 29, 31, 44, 49, 55]

Consumer1_path = pd.read_csv("ConsumptionReports/Consumption1.csv")
Consumer1_path.columns = consumption1_columns

# Drop the unwanted rows, then renumber the remaining rows from 0.
Consumer1_path = (
    Consumer1_path
    .drop(index=consumption1_rows_to_drop)
    .reset_index(drop=True)
)
Consumer1_path.head()

Unnamed: 0,State,Total Personal Consumption Expenditures 2019,Housing/Util.,Healthcare,Off-premises Food/Bev,Gasoline/Energy,All other Personal Consumptions
0,Connecticut,54786,11140,8218,3399,1062,30967
1,Maine,47351,7444,8216,4299,1889,25503
2,Massachusetts,56231,10710,9324,3761,885,31551
3,New Hampshire,54585,10180,9380,4091,1531,29403
4,Rhode Island,47045,9248,7889,3393,1043,25472


In [2]:
# Load the second consumption report and give its six columns readable names.
# Assigning the list requires the CSV to have exactly six columns.
consumption2_columns = [
    'State',
    '$ by Millions 2017',
    '$ by Millions 2018',
    'Total State Expenditure by Millions 2019',
    'Percent Change 2017-18',
    'Percent Change 2018-19',
]

# Positional row labels removed from the raw file.
# NOTE(review): presumably header, regional-subtotal and footnote rows rather
# than states -- confirm against the CSV.
consumption2_rows_to_drop = [0, 1, 2, 3, 10, 17, 23, 29, 31, 44, 49, 55]

Consumer2_path = pd.read_csv("ConsumptionReports/Consumption2.csv")
Consumer2_path.columns = consumption2_columns

# Drop the unwanted rows, then renumber the remaining rows from 0.
Consumer2_path = (
    Consumer2_path
    .drop(index=consumption2_rows_to_drop)
    .reset_index(drop=True)
)
Consumer2_path.head()

Unnamed: 0,State,$ by Millions 2017,$ by Millions 2018,Total State Expenditure by Millions 2019,Percent Change 2017-18,Percent Change 2018-19
0,Connecticut,182612,189857.0,195327.0,4.0,2.9
1,Maine,58853,61593.0,63650.0,4.7,3.3
2,Massachusetts,359649,374378.0,387570.0,4.1,3.5
3,New Hampshire,68532,71592.0,74220.0,4.5,3.7
4,Rhode Island,46363,48316.0,49838.0,4.2,3.2


In [3]:
# Join the two reports into one frame keyed on the shared 'State' column.
# Only `on` is passed: combining `on` with `left_index=True` mixes two
# mutually exclusive ways of naming the join key, and current pandas rejects
# that combination with a MergeError. The default inner join keeps states
# present in both frames and yields a fresh 0..n-1 index.
Total_consumption = pd.merge(Consumer1_path, Consumer2_path, on='State')
Total_consumption.head()

Unnamed: 0,State,Total Personal Consumption Expenditures 2019,Housing/Util.,Healthcare,Off-premises Food/Bev,Gasoline/Energy,All other Personal Consumptions,$ by Millions 2017,$ by Millions 2018,Total State Expenditure by Millions 2019,Percent Change 2017-18,Percent Change 2018-19
0,Connecticut,54786,11140,8218,3399,1062,30967,182612,189857.0,195327.0,4.0,2.9
1,Maine,47351,7444,8216,4299,1889,25503,58853,61593.0,63650.0,4.7,3.3
2,Massachusetts,56231,10710,9324,3761,885,31551,359649,374378.0,387570.0,4.1,3.5
3,New Hampshire,54585,10180,9380,4091,1531,29403,68532,71592.0,74220.0,4.5,3.7
4,Rhode Island,47045,9248,7889,3393,1043,25472,46363,48316.0,49838.0,4.2,3.2


In [4]:
# Remove the 2017/2018 totals and the 2017-18 percent change, leaving the
# 2019 state total and the 2018-19 percent change from the second report.
# This cell rebinds Total_consumption, so running it a second time raises
# KeyError because the columns are already gone.
columns_to_remove = ['$ by Millions 2017', '$ by Millions 2018', "Percent Change 2017-18"]
Total_consumption = Total_consumption.drop(columns=columns_to_remove)
Total_consumption

Unnamed: 0,State,Total Personal Consumption Expenditures 2019,Housing/Util.,Healthcare,Off-premises Food/Bev,Gasoline/Energy,All other Personal Consumptions,Total State Expenditure by Millions 2019,Percent Change 2018-19
0,Connecticut,54786,11140,8218,3399,1062,30967,195327.0,2.9
1,Maine,47351,7444,8216,4299,1889,25503,63650.0,3.3
2,Massachusetts,56231,10710,9324,3761,885,31551,387570.0,3.5
3,New Hampshire,54585,10180,9380,4091,1531,29403,74220.0,3.7
4,Rhode Island,47045,9248,7889,3393,1043,25472,49838.0,3.2
5,Vermont,49377,9018,9012,4206,1603,25538,30811.0,1.8
6,Delaware,45827,8335,9071,3468,1170,23783,44625.0,3.3
7,District of Columbia,65352,11936,10487,4058,696,38176,46122.0,3.2
8,Maryland,47529,11051,7717,2866,908,24986,287344.0,2.9
9,New Jersey,54216,11215,8229,3442,867,30463,481554.0,3.8


In [5]:
# Cast the two listed columns to float and print the resulting dtypes.
# NOTE(review): the other spending columns are left untouched by this cast;
# check their dtypes if they are to be plotted or aggregated later.
float_columns = (
    'Total Personal Consumption Expenditures 2019',
    'Off-premises Food/Bev',
)
convert_dict = {column_name: float for column_name in float_columns}

Total_consumption = Total_consumption.astype(convert_dict)
print(Total_consumption.dtypes)

State                                            object
Total Personal Consumption Expenditures 2019    float64
Housing/Util.                                    object
Healthcare                                       object
Off-premises Food/Bev                           float64
Gasoline/Energy                                  object
All other Personal Consumptions                  object
Total State Expenditure by Millions 2019        float64
Percent Change 2018-19                          float64
dtype: object


In [6]:
# Bar chart of 'Total Personal Consumption Expenditures 2019' for each state.
# DataFrame.plot returns the Axes it drew on; labelling and saving go through
# that Axes and its Figure so they cannot land on some other open figure.
ax = Total_consumption.plot(x='State', y='Total Personal Consumption Expenditures 2019', kind='bar', figsize=(7,5))
ax.set_title("Personal Expenditures")
ax.set_xlabel("State Name")
ax.set_ylabel("Yearly Expenditures ")

fig = ax.get_figure()
fig.tight_layout()

# Save before showing so the PNG always holds the finished figure.
fig.savefig("../Personal_consumption_exp.png")

# Call show: a bare `plt.show` only references the function and does nothing.
plt.show()

<IPython.core.display.Javascript object>

In [7]:
# Bar chart of 'Total State Expenditure by Millions 2019' for each state.
# DataFrame.plot returns the Axes it drew on; labelling and saving go through
# that Axes and its Figure so they cannot land on some other open figure.
ax = Total_consumption.plot(x='State', y='Total State Expenditure by Millions 2019', kind='bar', figsize=(7,5))
ax.set_title("State Expenditures")
ax.set_xlabel("State Name")
ax.set_ylabel("Yearly Expenditures ")

fig = ax.get_figure()
fig.tight_layout()

# Save before showing so the PNG always holds the finished figure.
fig.savefig("../State_consumption_exp.png")

# Call show: a bare `plt.show` only references the function and does nothing.
plt.show()

<IPython.core.display.Javascript object>

In [1]:
# Grouped bar chart with the state total and the personal consumption
# figure side by side for each state.
# This cell needs Total_consumption from the earlier cells; run the notebook
# top to bottom after a kernel restart or it fails with NameError.
# NOTE(review): both series share one y-axis; if their magnitudes differ a lot
# the smaller one will be hard to read -- consider `secondary_y` for one of
# them.
ax = Total_consumption.plot(x='State', y=['Total State Expenditure by Millions 2019','Total Personal Consumption Expenditures 2019'] , kind='bar', figsize=(7,5))
ax.set_title("Personal vs State Expenditures")
ax.set_xlabel("State Name")
ax.set_ylabel("Yearly Expenditures ")

fig = ax.get_figure()
fig.tight_layout()
fig.savefig("../Pers_vs_state_consume.png")

# Call show: a bare `plt.show` only references the function and does nothing.
plt.show()

NameError: name 'Total_consumption' is not defined