In [1]:
import pandas as pd
from sqlalchemy import create_engine

In [2]:
# Read depression csv and create df
csv_file = "./Resources/adult-depression-lghc-indicator-1.csv"
depression_df = pd.read_csv(csv_file, encoding="latin1")
depression_df.head()

Unnamed: 0,Year,Strata,Strata Name,Frequency,Weighted Frequency,Percent,Lower 95% CL,Upper 95% CL
0,2012,Total,Total,1920,,11.74,11.11,12.37
1,2012,Sex,Male,561,1116664.0,8.12,7.32,8.92
2,2012,Sex,Female,1359,2163108.0,15.25,14.3,16.2
3,2012,Race-Ethnicity,White,1314,1806371.0,14.57,13.67,15.46
4,2012,Race-Ethnicity,Black,97,222022.0,13.54,10.44,16.65


In [3]:
# Read obesity csv and create df
csv_file_2 = "./Resources/Obesity_in_California__2012_and_2013.csv"
obesity_df = pd.read_csv(csv_file_2, encoding="latin1")
obesity_df.head()

Unnamed: 0,Year,Age Group,Category,Type,Obese (%)
0,2012,Adolescent (12-17),All,Total,11.2
1,2012,Adolescent (12-17),Gender,Male,14.6
2,2012,Adolescent (12-17),Gender,Female,7.8
3,2012,Adolescent (12-17),Gender by Age- Male,12-13,15.2
4,2012,Adolescent (12-17),Gender by Age- Male,14-15,14.2


In [4]:
# Rename depression df columns
depression = depression_df.rename(columns = {"Year": "study_year",
                                            "Strata":"strata", "Strata Name":"strata_type",
                                            "Frequency":"frequency","Weighted Frequency":"weighted_frequency",
                                           "Percent":"percent", "Lower 95% CL":"lower_95", "Upper 95% CL":"upper_95"})
depression.head()

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
0,2012,Total,Total,1920,,11.74,11.11,12.37
1,2012,Sex,Male,561,1116664.0,8.12,7.32,8.92
2,2012,Sex,Female,1359,2163108.0,15.25,14.3,16.2
3,2012,Race-Ethnicity,White,1314,1806371.0,14.57,13.67,15.46
4,2012,Race-Ethnicity,Black,97,222022.0,13.54,10.44,16.65


In [5]:
# Rename obesity df columns
obesity = obesity_df.rename(columns = {"Year": "study_year", "Age Group":"age_group",
                                            "Category":"strata", "Type":"strata_type",
                                            "Obese (%)":"obesity"})
obesity.head()

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
0,2012,Adolescent (12-17),All,Total,11.2
1,2012,Adolescent (12-17),Gender,Male,14.6
2,2012,Adolescent (12-17),Gender,Female,7.8
3,2012,Adolescent (12-17),Gender by Age- Male,12-13,15.2
4,2012,Adolescent (12-17),Gender by Age- Male,14-15,14.2


In [6]:
# Filter by study year (2012-2013) for obesity df
obesity = obesity.loc[obesity['study_year'].isin([2013])]
obesity

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
24,2013,Adult (18+),All,Total,30.2
25,2013,Adult (18+),Gender,Male,26.5
26,2013,Adult (18+),Gender,Female,33.9
27,2013,Adult (18+),Age,18 - 24,21.1
28,2013,Adult (18+),Age,25 - 34,30.6
29,2013,Adult (18+),Age,35 - 50,33.4
30,2013,Adult (18+),Age,51 - 64,35.2
31,2013,Adult (18+),Age,65+,25.2
32,2013,Adult (18+),Ethnicity,White,27.1
33,2013,Adult (18+),Ethnicity,African American,44.2


In [7]:
# Filter by study year (2012-2013) for depression df
depression = depression.loc[depression['study_year'].isin([2013])]
depression

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
23,2013,Total,Total,1689,,13.08,12.33,13.82
24,2013,Sex,Male,539,1307668.0,9.53,8.53,10.52
25,2013,Sex,Female,1150,2337817.0,16.52,15.42,17.62
26,2013,Race-Ethnicity,White,1103,1979888.0,15.97,14.91,17.02
27,2013,Race-Ethnicity,Black,93,252871.0,15.46,11.91,19.02
28,2013,Race-Ethnicity,Hispanic,403,1011594.0,10.96,9.72,12.2
29,2013,Race-Ethnicity,Asian/Pacific Islander,62,308822.0,7.38,5.26,9.5
30,2013,Race-Ethnicity,Other,28,92309.0,21.63,12.57,30.69
31,2013,Education,No High School Diploma,222,510371.0,12.84,10.87,14.81
32,2013,Education,High School Graduate or GED Certificate,361,841995.0,14.28,12.5,16.06


In [8]:
# Filter by age group (Adult 18+) for obesity df
new_obesity = obesity.loc[obesity['age_group'] == "Adult (18+)"]
new_obesity

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
24,2013,Adult (18+),All,Total,30.2
25,2013,Adult (18+),Gender,Male,26.5
26,2013,Adult (18+),Gender,Female,33.9
27,2013,Adult (18+),Age,18 - 24,21.1
28,2013,Adult (18+),Age,25 - 34,30.6
29,2013,Adult (18+),Age,35 - 50,33.4
30,2013,Adult (18+),Age,51 - 64,35.2
31,2013,Adult (18+),Age,65+,25.2
32,2013,Adult (18+),Ethnicity,White,27.1
33,2013,Adult (18+),Ethnicity,African American,44.2


In [9]:
# Get age group (Adult 18+) rows in obesity df to change
obesity_change1 = obesity.loc[obesity['strata_type'].isin(["18 - 24", "25 - 34", "35 - 50", "51 - 64"])]
obesity_change1

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
27,2013,Adult (18+),Age,18 - 24,21.1
28,2013,Adult (18+),Age,25 - 34,30.6
29,2013,Adult (18+),Age,35 - 50,33.4
30,2013,Adult (18+),Age,51 - 64,35.2


In [10]:
# Create new rows that combine data (average)
obesity_change1.loc[31] = [2013, "Adult (18+)", "Age", "18 - 34", (obesity_change1.loc[27,'obesity'] + obesity_change1.loc[28,'obesity'])/2]
obesity_change1.loc[32] = [2013, "Adult (18+)", "Age", "35 - 64", (obesity_change1.loc[29,'obesity'] + obesity_change1.loc[30,'obesity'])/2]
obesity_change1

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  This is separate from the ipykernel package so we can avoid doing imports until


Unnamed: 0,study_year,age_group,strata,strata_type,obesity
27,2013,Adult (18+),Age,18 - 24,21.1
28,2013,Adult (18+),Age,25 - 34,30.6
29,2013,Adult (18+),Age,35 - 50,33.4
30,2013,Adult (18+),Age,51 - 64,35.2
31,2013,Adult (18+),Age,18 - 34,25.85
32,2013,Adult (18+),Age,35 - 64,34.3


In [11]:
# Remove old age group rows (27, 28, 29, 30), and insert new rows into table (add 27, 28). Sort index. 
new_obesity2 = new_obesity.drop([27, 28, 29, 30])
new_obesity2.loc[27] = obesity_change1.loc[31]
new_obesity2.loc[28] = obesity_change1.loc[32]
new_obesity2 = new_obesity2.sort_index()
new_obesity2

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
24,2013,Adult (18+),All,Total,30.2
25,2013,Adult (18+),Gender,Male,26.5
26,2013,Adult (18+),Gender,Female,33.9
27,2013,Adult (18+),Age,18 - 34,25.85
28,2013,Adult (18+),Age,35 - 64,34.3
31,2013,Adult (18+),Age,65+,25.2
32,2013,Adult (18+),Ethnicity,White,27.1
33,2013,Adult (18+),Ethnicity,African American,44.2
34,2013,Adult (18+),Ethnicity,Latino,34.0
35,2013,Adult (18+),Ethnicity,Asian/Other,23.9


In [12]:
# Get income rows in obesity df to change
obesity_change2 = obesity.loc[obesity['strata_type'].isin(["Less than $15,000", "$15,000 - 24,999", "$25,000 - 34,999"])]
obesity_change2

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
40,2013,Adult (18+),Income,"Less than $15,000",32.4
41,2013,Adult (18+),Income,"$15,000 - 24,999",37.7
42,2013,Adult (18+),Income,"$25,000 - 34,999",28.1


In [13]:
# Create new row that combines data (average)
obesity_change2.loc[43] = [2013, "Adult (18+)", "Income", "< $35,000", (obesity_change2.loc[40,'obesity'] + obesity_change2.loc[41,'obesity'] + obesity_change2.loc[42,'obesity'])/3]
obesity_change2

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  


Unnamed: 0,study_year,age_group,strata,strata_type,obesity
40,2013,Adult (18+),Income,"Less than $15,000",32.4
41,2013,Adult (18+),Income,"$15,000 - 24,999",37.7
42,2013,Adult (18+),Income,"$25,000 - 34,999",28.1
43,2013,Adult (18+),Income,"< $35,000",32.733333


In [14]:
# Remove old rows (40, 41, 42), and insert new row into table (add 40). Sort index. 
new_obesity3 = new_obesity2.drop([40, 41, 42])
new_obesity3.loc[40] = obesity_change2.loc[43]
edited_obesity = new_obesity3.sort_index()
edited_obesity

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
24,2013,Adult (18+),All,Total,30.2
25,2013,Adult (18+),Gender,Male,26.5
26,2013,Adult (18+),Gender,Female,33.9
27,2013,Adult (18+),Age,18 - 34,25.85
28,2013,Adult (18+),Age,35 - 64,34.3
31,2013,Adult (18+),Age,65+,25.2
32,2013,Adult (18+),Ethnicity,White,27.1
33,2013,Adult (18+),Ethnicity,African American,44.2
34,2013,Adult (18+),Ethnicity,Latino,34.0
35,2013,Adult (18+),Ethnicity,Asian/Other,23.9


In [15]:
# Get race/ethnicity rows in depression df to change
depression_change1 = depression.loc[depression['strata_type'].isin(["Asian/Pacific Islander", "Other"])]
depression_change1

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
29,2013,Race-Ethnicity,Asian/Pacific Islander,62,308822.0,7.38,5.26,9.5
30,2013,Race-Ethnicity,Other,28,92309.0,21.63,12.57,30.69


In [16]:
# Create new row that combines data (frequncy sum and average for other stats)
depression_change1.loc[31] = [2013, "Race-Ethnicity", "Asian/Other",
    depression_change1.loc[29,'frequency'] + depression_change1.loc[30,'frequency'],
    (depression_change1.loc[29,'weighted_frequency'] + depression_change1.loc[30,'weighted_frequency'])/2,
    (depression_change1.loc[29,'percent'] + depression_change1.loc[30,'percent'])/2,
    (depression_change1.loc[29,'lower_95'] + depression_change1.loc[30,'lower_95'])/2,
    (depression_change1.loc[29,'upper_95'] + depression_change1.loc[30,'upper_95'])/2,
    ]
depression_change1

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  import sys


Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
29,2013,Race-Ethnicity,Asian/Pacific Islander,62,308822.0,7.38,5.26,9.5
30,2013,Race-Ethnicity,Other,28,92309.0,21.63,12.57,30.69
31,2013,Race-Ethnicity,Asian/Other,90,200565.5,14.505,8.915,20.095


In [17]:
# Remove old rows (29, 30), and insert new row into table (add 29). Sort index. 
new_depression = depression.drop([29, 30])
new_depression.loc[29] = depression_change1.loc[31]
new_depression = new_depression.sort_index()
new_depression

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
23,2013,Total,Total,1689,,13.08,12.33,13.82
24,2013,Sex,Male,539,1307668.0,9.53,8.53,10.52
25,2013,Sex,Female,1150,2337817.0,16.52,15.42,17.62
26,2013,Race-Ethnicity,White,1103,1979888.0,15.97,14.91,17.02
27,2013,Race-Ethnicity,Black,93,252871.0,15.46,11.91,19.02
28,2013,Race-Ethnicity,Hispanic,403,1011594.0,10.96,9.72,12.2
29,2013,Race-Ethnicity,Asian/Other,90,200565.5,14.505,8.915,20.095
31,2013,Education,No High School Diploma,222,510371.0,12.84,10.87,14.81
32,2013,Education,High School Graduate or GED Certificate,361,841995.0,14.28,12.5,16.06
33,2013,Education,Some College or Tech School,504,1069791.0,15.37,13.81,16.93


In [18]:
# Get age group rows in depression df to change
depression_change2 = depression.loc[depression['strata_type'].isin(["35 to 44", "45 to 54", "55 to 64"])]
depression_change2

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
42,2013,Age,35 to 44,198,538114.0,10.42,8.84,11.99
43,2013,Age,45 to 54,347,880554.0,16.81,14.85,18.77
44,2013,Age,55 to 64,456,741063.0,18.39,16.6,20.18


In [19]:
# Create new row that combines data (frequncy sum and average for other stats)
depression_change2.loc[45] = [2013, "Age", "35 to 64",
    depression_change2.loc[42,'frequency'] + depression_change2.loc[43,'frequency'] + depression_change2.loc[44,'frequency'],
    (depression_change2.loc[42,'weighted_frequency'] + depression_change2.loc[43,'weighted_frequency'] + depression_change2.loc[44,'weighted_frequency'])/3,
    (depression_change2.loc[42,'percent'] + depression_change2.loc[43,'percent'] + depression_change2.loc[43,'percent'])/3,
    (depression_change2.loc[42,'lower_95'] + depression_change2.loc[43,'lower_95'] + depression_change2.loc[44,'lower_95'])/3,
    (depression_change2.loc[42,'upper_95'] + depression_change2.loc[43,'upper_95'] + depression_change2.loc[44,'upper_95'])/3,
    ]
depression_change2

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  import sys


Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
42,2013,Age,35 to 44,198,538114.0,10.42,8.84,11.99
43,2013,Age,45 to 54,347,880554.0,16.81,14.85,18.77
44,2013,Age,55 to 64,456,741063.0,18.39,16.6,20.18
45,2013,Age,35 to 64,1001,719910.333333,14.68,13.43,16.98


In [20]:
# Remove old rows (42, 43, 44), and insert new row into table (add 42). Sort index. 
new_depression2 = new_depression.drop([42, 43, 44])
new_depression2.loc[42] = depression_change2.loc[45]
new_depression2 = new_depression2.sort_index()
new_depression2

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
23,2013,Total,Total,1689,,13.08,12.33,13.82
24,2013,Sex,Male,539,1307668.0,9.53,8.53,10.52
25,2013,Sex,Female,1150,2337817.0,16.52,15.42,17.62
26,2013,Race-Ethnicity,White,1103,1979888.0,15.97,14.91,17.02
27,2013,Race-Ethnicity,Black,93,252871.0,15.46,11.91,19.02
28,2013,Race-Ethnicity,Hispanic,403,1011594.0,10.96,9.72,12.2
29,2013,Race-Ethnicity,Asian/Other,90,200565.5,14.505,8.915,20.095
31,2013,Education,No High School Diploma,222,510371.0,12.84,10.87,14.81
32,2013,Education,High School Graduate or GED Certificate,361,841995.0,14.28,12.5,16.06
33,2013,Education,Some College or Tech School,504,1069791.0,15.37,13.81,16.93


In [21]:
# Get income rows in depression df to change
depression_change3 = depression.loc[depression['strata_type'].isin(["< $20,000", "$20,000 - $34,999",
         "$35,000 - $49,999", "$50,000 - $74,999","$75,000 - $99,999","$100,000+"])]
depression_change3

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
35,2013,Income,"< $20,000",600,1286100.0,18.63,16.89,20.38
36,2013,Income,"$20,000 - $34,999",283,560739.0,14.57,12.5,16.64
37,2013,Income,"$35,000 - $49,999",149,305677.0,11.29,8.89,13.68
38,2013,Income,"$50,000 - $74,999",186,394993.0,12.26,10.17,14.34
39,2013,Income,"$75,000 - $99,999",155,321528.0,12.04,9.88,14.2
40,2013,Income,"$100,000+",213,541245.0,9.89,8.34,11.44


In [22]:
# Create new rows that combines data (frequncy sum and average for other stats)
# < $35,000 income group
depression_change3.loc[41] = [2013, "Income", "< $35,000",
    depression_change3.loc[35,'frequency'] + depression_change3.loc[36,'frequency'],
    (depression_change3.loc[35,'weighted_frequency'] + depression_change3.loc[36,'weighted_frequency'])/2,
    (depression_change3.loc[35,'percent'] + depression_change3.loc[36,'percent'])/2,
    (depression_change3.loc[35,'lower_95'] + depression_change3.loc[36,'lower_95'])/2,
    (depression_change3.loc[35,'upper_95'] + depression_change3.loc[36,'upper_95'])/2,
    ]

# $50,000+ income group
depression_change3.loc[42] = [2013, "Income", "$50,000+",
    depression_change3.loc[38,'frequency'] + depression_change3.loc[39,'frequency'] + depression_change3.loc[40,'frequency'],
    (depression_change3.loc[38,'weighted_frequency'] + depression_change3.loc[39,'weighted_frequency'] + depression_change3.loc[40,'weighted_frequency'])/3,
    (depression_change3.loc[38,'percent'] + depression_change3.loc[39,'percent'] + depression_change3.loc[40,'percent'])/3,
    (depression_change3.loc[38,'lower_95'] + depression_change3.loc[39,'lower_95'] + depression_change3.loc[40,'lower_95'])/3,
    (depression_change3.loc[38,'upper_95'] + depression_change3.loc[39,'upper_95'] + depression_change3.loc[40,'upper_95'])/3,
    ]

depression_change3

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy


Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
35,2013,Income,"< $20,000",600,1286100.0,18.63,16.89,20.38
36,2013,Income,"$20,000 - $34,999",283,560739.0,14.57,12.5,16.64
37,2013,Income,"$35,000 - $49,999",149,305677.0,11.29,8.89,13.68
38,2013,Income,"$50,000 - $74,999",186,394993.0,12.26,10.17,14.34
39,2013,Income,"$75,000 - $99,999",155,321528.0,12.04,9.88,14.2
40,2013,Income,"$100,000+",213,541245.0,9.89,8.34,11.44
41,2013,Income,"< $35,000",883,923419.5,16.6,14.695,18.51
42,2013,Income,"$50,000+",554,419255.3,11.396667,9.463333,13.326667


In [23]:
# Remove old rows (35, 35, 38, 39, 40), and insert new rows into table (add 35, 38). Sort index. 
new_depression3 = new_depression2.drop([35, 36, 38, 39, 40])
new_depression3.loc[35] = depression_change3.loc[41]
new_depression3.loc[38] = depression_change3.loc[42]
edited_depression = new_depression3.sort_index()
edited_depression

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
23,2013,Total,Total,1689,,13.08,12.33,13.82
24,2013,Sex,Male,539,1307668.0,9.53,8.53,10.52
25,2013,Sex,Female,1150,2337817.0,16.52,15.42,17.62
26,2013,Race-Ethnicity,White,1103,1979888.0,15.97,14.91,17.02
27,2013,Race-Ethnicity,Black,93,252871.0,15.46,11.91,19.02
28,2013,Race-Ethnicity,Hispanic,403,1011594.0,10.96,9.72,12.2
29,2013,Race-Ethnicity,Asian/Other,90,200565.5,14.505,8.915,20.095
31,2013,Education,No High School Diploma,222,510371.0,12.84,10.87,14.81
32,2013,Education,High School Graduate or GED Certificate,361,841995.0,14.28,12.5,16.06
33,2013,Education,Some College or Tech School,504,1069791.0,15.37,13.81,16.93


In [54]:
# Rename education strata types for obesity df
edited_obesity = edited_obesity.replace(
    {"Less than High School" : "No High School Diploma", 
     "High School Graduate" : "High School Graduate or GED Certificate", 
     "Some College" : "Some College or Tech School",
     "College Graduate" : "College Graduate or Post Grad"})
edited_obesity.reset_index(drop=True, inplace=True)
edited_obesity

Unnamed: 0,study_year,age_group,strata,strata_type,obesity
0,2013,Adult (18+),All,Total,30.2
1,2013,Adult (18+),Gender,Male,26.5
2,2013,Adult (18+),Gender,Female,33.9
3,2013,Adult (18+),Age,18 - 34,25.85
4,2013,Adult (18+),Age,35 - 64,34.3
5,2013,Adult (18+),Age,65+,25.2
6,2013,Adult (18+),Ethnicity,White,27.1
7,2013,Adult (18+),Ethnicity,African American,44.2
8,2013,Adult (18+),Ethnicity,Latino,34.0
9,2013,Adult (18+),Ethnicity,Asian/Other,23.9


In [55]:
# Rename gender, income, age, and race/ethnicity strata types for depression df
edited_depression = edited_depression.replace(
    {"Sex" : "Gender", 
     "$35,000 - $49,999": "$35,000 - 49,999",
     "18 to 34" : "18 - 34",
     "35 to 64" : "35 - 64",
     "65+ years" : "65+",
     "Race-Ethnicity" : "Ethnicity",
     "Black" : "African American", 
     "Asian/Pacific Islander" : "Asian/Other", 
     "Hispanic" : "Latino"})
edited_depression.reset_index(drop=True, inplace=True)
edited_depression

Unnamed: 0,study_year,strata,strata_type,frequency,weighted_frequency,percent,lower_95,upper_95
0,2013,Total,Total,1689,,13.08,12.33,13.82
1,2013,Gender,Male,539,1307668.0,9.53,8.53,10.52
2,2013,Gender,Female,1150,2337817.0,16.52,15.42,17.62
3,2013,Ethnicity,White,1103,1979888.0,15.97,14.91,17.02
4,2013,Ethnicity,African American,93,252871.0,15.46,11.91,19.02
5,2013,Ethnicity,Latino,403,1011594.0,10.96,9.72,12.2
6,2013,Ethnicity,Asian/Other,90,200565.5,14.505,8.915,20.095
7,2013,Education,No High School Diploma,222,510371.0,12.84,10.87,14.81
8,2013,Education,High School Graduate or GED Certificate,361,841995.0,14.28,12.5,16.06
9,2013,Education,Some College or Tech School,504,1069791.0,15.37,13.81,16.93


In [56]:
# Connect to database
rds_connection_string = "root:<password>@127.0.0.1/obesity_depression_db"
engine = create_engine(f'mysql://{rds_connection_string}')

In [27]:
# Check table names
engine.table_names()

['depression', 'obesity']

In [57]:
# Transfer edited depression data to depression table in database
edited_depression.to_sql(name='depression', con=engine, if_exists='append', index=False)

In [58]:
# Transfer edited obesity data to obesity table in database
edited_obesity.to_sql(name='obesity', con=engine, if_exists='append', index=False)