In [1]:
# Setup
from pathlib import Path

import pandas as pd

In [2]:
# Load the two source CSVs (income by year, GDP by year) into DataFrames
income_csv_path = "Resources/income_vs_year.csv"
gdp_csv_path = "Resources/GDP_1969_2020.csv"

income_df = pd.read_csv(income_csv_path)
gdp_df = pd.read_csv(gdp_csv_path)

In [3]:
# Inspect the income table exactly as loaded, before any cleaning or merging
income_df

Unnamed: 0,Year,Population (No. of People),Disposable Personal Income (Millions of Dollars),Personal Income (Millions of Dollars),Per Capita Disposable Personal Income (Dollars),Per Capita Personal Income (Dollars)
0,1969,201298000,"$687,425.00","$791,229.00","$3,415","$3,931"
1,1970,203798722,"$753,099.00","$855,525.00","$3,695","$4,198"
2,1971,206817509,"$823,437.00","$924,613.00","$3,981","$4,471"
3,1972,209274882,"$893,321.00","$1,016,408.00","$4,269","$4,857"
4,1973,211349205,"$1,001,571.00","$1,133,468.00","$4,739","$5,363"
5,1974,213333635,"$1,094,397.00","$1,244,912.00","$5,130","$5,836"
6,1975,215456585,"$1,215,359.00","$1,362,505.00","$5,641","$6,324"
7,1976,217553859,"$1,323,488.00","$1,495,704.00","$6,083","$6,875"
8,1977,219760875,"$1,454,268.00","$1,651,632.00","$6,618","$7,516"
9,1978,222098244,"$1,626,753.00","$1,855,849.00","$7,324","$8,356"


In [4]:
# Inspect the GDP table exactly as loaded, before any renaming or formatting
gdp_df

Unnamed: 0,Years,GDP
0,1969,962901.7
1,1970,1012299.3
2,1971,1097173.4
3,1972,1210292.4
4,1973,1356499.7
5,1974,1472024.2
6,1975,1602227.6
7,1976,1780497.3
8,1977,1986407.7
9,1978,2243230.1


In [5]:
# Prepare gdp_df for the merge:
#   - "Years" becomes "Year" so the join key matches income_df
#   - "GDP" gains a unit suffix for readability
#   - GDP values are rendered as "$1,234.56"-style strings
# NOTE(review): the raw figures (e.g. 962901.7 for 1969) look like millions of
# dollars rather than dollars -- confirm the unit used in the column label.
# NOTE(review): this cell reassigns gdp_df, so it is meant to run once per
# kernel; on a second run the numeric format is applied to strings and fails.
gdp_df = (
    gdp_df
    .rename(columns={"Years": "Year", "GDP": "GDP (Dollars)"})
    .assign(**{"GDP (Dollars)": lambda frame: frame["GDP (Dollars)"].map("${:,.2f}".format)})
)

gdp_df.head()

Unnamed: 0,Year,GDP (Dollars)
0,1969,"$962,901.70"
1,1970,"$1,012,299.30"
2,1971,"$1,097,173.40"
3,1972,"$1,210,292.40"
4,1973,"$1,356,499.70"


In [6]:
# Outer-join the GDP and income tables on their shared "Year" key, keeping
# years that appear in only one of the two sources
gdp_income_df = gdp_df.merge(income_df, on="Year", how="outer")

In [7]:
# Inspect the merged table; because the join is "outer", a year present in only
# one source shows up here with NaN in the other source's columns
gdp_income_df

Unnamed: 0,Year,GDP (Dollars),Population (No. of People),Disposable Personal Income (Millions of Dollars),Personal Income (Millions of Dollars),Per Capita Disposable Personal Income (Dollars),Per Capita Personal Income (Dollars)
0,1969,"$962,901.70",201298000.0,"$687,425.00","$791,229.00","$3,415","$3,931"
1,1970,"$1,012,299.30",203798722.0,"$753,099.00","$855,525.00","$3,695","$4,198"
2,1971,"$1,097,173.40",206817509.0,"$823,437.00","$924,613.00","$3,981","$4,471"
3,1972,"$1,210,292.40",209274882.0,"$893,321.00","$1,016,408.00","$4,269","$4,857"
4,1973,"$1,356,499.70",211349205.0,"$1,001,571.00","$1,133,468.00","$4,739","$5,363"
5,1974,"$1,472,024.20",213333635.0,"$1,094,397.00","$1,244,912.00","$5,130","$5,836"
6,1975,"$1,602,227.60",215456585.0,"$1,215,359.00","$1,362,505.00","$5,641","$6,324"
7,1976,"$1,780,497.30",217553859.0,"$1,323,488.00","$1,495,704.00","$6,083","$6,875"
8,1977,"$1,986,407.70",219760875.0,"$1,454,268.00","$1,651,632.00","$6,618","$7,516"
9,1978,"$2,243,230.10",222098244.0,"$1,626,753.00","$1,855,849.00","$7,324","$8,356"


In [8]:
# Drop every row that contains a missing value (the outer merge leaves NaN for
# a year found in only one source -- presumably just 2020; verify), then
# promote "Year" from a regular column to the index
gdp_income_df = gdp_income_df.dropna(axis="rows").set_index("Year")

In [9]:
# Display the cleaned GDP/income table: rows with missing values removed and
# "Year" used as the index
gdp_income_df

Unnamed: 0_level_0,GDP (Dollars),Population (No. of People),Disposable Personal Income (Millions of Dollars),Personal Income (Millions of Dollars),Per Capita Disposable Personal Income (Dollars),Per Capita Personal Income (Dollars)
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
1969,"$962,901.70",201298000,"$687,425.00","$791,229.00","$3,415","$3,931"
1970,"$1,012,299.30",203798722,"$753,099.00","$855,525.00","$3,695","$4,198"
1971,"$1,097,173.40",206817509,"$823,437.00","$924,613.00","$3,981","$4,471"
1972,"$1,210,292.40",209274882,"$893,321.00","$1,016,408.00","$4,269","$4,857"
1973,"$1,356,499.70",211349205,"$1,001,571.00","$1,133,468.00","$4,739","$5,363"
1974,"$1,472,024.20",213333635,"$1,094,397.00","$1,244,912.00","$5,130","$5,836"
1975,"$1,602,227.60",215456585,"$1,215,359.00","$1,362,505.00","$5,641","$6,324"
1976,"$1,780,497.30",217553859,"$1,323,488.00","$1,495,704.00","$6,083","$6,875"
1977,"$1,986,407.70",219760875,"$1,454,268.00","$1,651,632.00","$6,618","$7,516"
1978,"$2,243,230.10",222098244,"$1,626,753.00","$1,855,849.00","$7,324","$8,356"


In [10]:
# Persist the cleaned table (with its Year index) as both CSV and Excel.
# The output folder is created first: pandas does not create missing parent
# directories, so on a fresh checkout without "Output/" the writes would fail.
output_dir = Path("Output")
output_dir.mkdir(parents=True, exist_ok=True)

# Export combined df to csv
gdp_income_df.to_csv(output_dir / "gdp_income.csv")

# Export combined df to spreadsheet
gdp_income_df.to_excel(output_dir / "gdp_income.xlsx")