# Cleaned and merged OSMI yearly data

## Module and file imports

In [21]:
import pandas as pd
from IPython.display import display, HTML

In [22]:
# Raw inputs: one previously merged file plus one survey export per year.
# All paths are relative to the notebook's working directory.
raw_paths = {
    'merged': '../OSMI Raw Data/OSMI_merged.csv',
    2017: '../OSMI Raw Data/OSMI_Mental_Health_in_Tech_Survey_2017.csv',
    2018: '../OSMI Raw Data/OSMI_Mental_Health_in_Tech_Survey_2018.csv',
    2019: '../OSMI Raw Data/OSMI_2019_Mental_Health_in_Tech_Survey_Results.csv',
    2020: '../OSMI Raw Data/OSMI_2020_Mental_Health_in_Tech_Survey.csv',
    2021: '../OSMI Raw Data/OSMI_2021_Mental_Health_in_Tech_Survey.csv',
}

# Read in the same order as before: merged file first, then the years ascending.
df_cleaned = pd.read_csv(raw_paths['merged'])
df_2017 = pd.read_csv(raw_paths[2017])
df_2018 = pd.read_csv(raw_paths[2018])
df_2019 = pd.read_csv(raw_paths[2019])
df_2020 = pd.read_csv(raw_paths[2020])
df_2021 = pd.read_csv(raw_paths[2021])

### Initial look at the potential for an automated merge

Finding: numerous column names vary slightly between years, so the yearly files cannot be merged automatically - manual renaming is needed.

In [23]:
# Total number of rows (survey responses) across the five yearly files.
total_row_length = sum(map(len, (df_2017, df_2018, df_2019, df_2020, df_2021)))

# TODO: compare this figure to the pre-merged data (the comparison was never written;
# presumably against len(df_cleaned) - confirm).
total_row_length

1836

In [24]:
# Count the distinct column names that appear in at least one yearly file.
yearly_frames = (df_2017, df_2018, df_2019, df_2020, df_2021)

# Grow the set one year at a time; duplicates across years collapse automatically.
# (The loop variable `df` stays bound to the last frame afterwards, as before.)
unique_columns = set()
for df in yearly_frames:
    unique_columns |= set(df.columns)

total_unique_columns = len(unique_columns)
total_unique_columns



151

In [25]:
# Count the column names shared by every yearly file: start from the 2017
# names and keep only those that each later year also contains.
common_columns = set(df_2017.columns)
for df in (df_2018, df_2019, df_2020, df_2021):
    common_columns &= set(df.columns)

total_common_columns = len(common_columns)
total_common_columns

58

## Prepping data sets for merge

### 2017 column reduction and renaming

In [26]:
# Show every raw 2017 column name so the columns to keep can be picked by hand.
list(df_2017.columns)

['#',
 '<strong>Are you self-employed?</strong>',
 'How many employees does your company or organization have?',
 'Is your employer primarily a tech company/organization?',
 'Is your primary role within your company related to tech/IT?',
 'Does your employer provide mental health benefits\xa0as part of healthcare coverage?',
 'Do you know the options for mental health care available under your employer-provided health coverage?',
 'Has your employer ever formally discussed mental health (for example, as part of a wellness campaign or other official communication)?',
 'Does your employer offer resources to learn more about mental health disorders and options for seeking help?',
 'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
 'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
 'Would you feel more comforta

In [27]:
# Columns kept from the 2017 survey, written exactly as they appear in the raw
# export (note the non-breaking space, \xa0, in the benefits question and the
# <strong> tags in several headers).
columns_2017 = [
    'Is your employer primarily a tech company/organization?',
    'Does your employer provide mental health benefits\xa0as part of healthcare coverage?',
    'Do you know the options for mental health care available under your employer-provided health coverage?',
    'Do you currently have a mental health disorder?',
    'Have you ever been diagnosed with a mental health disorder?',
    'Do you have a family history of mental illness?',
    'Have you ever discussed your mental health with your employer?',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?',
    'Would you feel comfortable discussing a mental health issue with your coworkers?',
    'How many employees does your company or organization have?',
    'Overall, how well do you think the tech industry supports employees with mental health issues?',
    '<strong>Have you observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?</strong>',
    '<strong>Have you observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace?</strong>',
    'What is your age?',
    'What is your gender?',
    'What country do you <strong>live</strong> in?',
    'What is your race?',
    'Start Date (UTC)',
    'Submit Date (UTC)',
]

# Selecting with a list returns a new frame holding only these columns, in this order.
df_2017_reduced = df_2017[columns_2017]



In [28]:

# Map each verbose 2017 survey question to the short column name used for the merge.
# The two date columns are not listed here, so they keep their original names.
rename_map_2017 = {
    'Is your employer primarily a tech company/organization?': 'tech company',
    'Does your employer provide mental health benefits\xa0as part of healthcare coverage?': 'employer provided healthcare with mental benefits',
    'Do you know the options for mental health care available under your employer-provided health coverage?': 'employer provided mental healthcare awareness',
    'Do you currently have a mental health disorder?': 'current mental health disorder',
    'Have you ever been diagnosed with a mental health disorder?': 'mental health diagnosis',
    'Do you have a family history of mental illness?': 'family history of mental illness',
    'Have you ever discussed your mental health with your employer?': 'discussed personal mental health with employer',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?': 'anonymity protected when using benefits',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?': 'ease of asking for leave',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?': 'comfortable discussing a mental health issue with direct supervisor(s)',
    'Would you feel comfortable discussing a mental health issue with your coworkers?': 'comfortable discussing a mental health issue with coworkers',
    'How many employees does your company or organization have?': 'Number of employees',
    'Overall, how well do you think the tech industry supports employees with mental health issues?': 'how well do you think the tech industry supports employees with mental health issues',
    '<strong>Have you observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?</strong>': 'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
    '<strong>Have you observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace?</strong>': 'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
    'What is your age?': 'Age',
    'What is your gender?': 'Gender',
    'What country do you <strong>live</strong> in?': 'Country of residence',
    'What is your race?': 'Race',
}

df_2017_reduced = df_2017_reduced.rename(columns=rename_map_2017)

# Preview the first rows to confirm the new column names.
df_2017_reduced.head()

Unnamed: 0,tech company,employer provided healthcare with mental benefits,employer provided mental healthcare awareness,current mental health disorder,mental health diagnosis,family history of mental illness,discussed personal mental health with employer,anonymity protected when using benefits,ease of asking for leave,comfortable discussing a mental health issue with direct supervisor(s),...,Number of employees,how well do you think the tech industry supports employees with mental health issues,observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?,observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace,Age,Gender,Country of residence,Race,Start Date (UTC),Submit Date (UTC)
0,1.0,No,Yes,Possibly,,No,0.0,I don't know,I don't know,Yes,...,100-500,1.0,"Yes, I experienced","Yes, I experienced",27.0,Female,United Kingdom,,2018-05-16 12:32:04,2018-05-16 12:42:40
1,1.0,Yes,Yes,Possibly,,No,0.0,I don't know,I don't know,Maybe,...,100-500,2.0,"Yes, I observed",Maybe/Not sure,31.0,male,United Kingdom,,2018-05-16 12:31:13,2018-05-16 12:40:40
2,1.0,I don't know,No,Yes,Yes,Yes,1.0,Yes,Difficult,Yes,...,6-25,1.0,"Yes, I experienced","Yes, I experienced",36.0,male,United States of America,White,2018-05-09 05:34:05,2018-05-09 05:46:04
3,1.0,Yes,Yes,Yes,Yes,I don't know,1.0,Yes,Difficult,Yes,...,More than 1000,2.0,Maybe/Not sure,Maybe/Not sure,22.0,Male,United States of America,White,2018-05-04 23:19:14,2018-05-04 23:23:23
4,,,,No,,Yes,,,,,...,,1.0,No,"Yes, I observed",52.0,female,United States of America,More than one of the above,2018-05-03 00:40:24,2018-05-03 00:53:20


In [29]:
# Render the whole reduced 2017 frame as an HTML table inside a scrollable
# box (capped at 600px high) so the full table does not flood the notebook.
html = df_2017_reduced.to_html()
scroll_box = ''.join(['<div style="max-height: 600px; overflow: auto;">', html, '</div>'])
display(HTML(scroll_box))

Unnamed: 0,tech company,employer provided healthcare with mental benefits,employer provided mental healthcare awareness,current mental health disorder,mental health diagnosis,family history of mental illness,discussed personal mental health with employer,anonymity protected when using benefits,ease of asking for leave,comfortable discussing a mental health issue with direct supervisor(s),comfortable discussing a mental health issue with coworkers,Number of employees,how well do you think the tech industry supports employees with mental health issues,observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?,observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace,Age,Gender,Country of residence,Race,Start Date (UTC),Submit Date (UTC)
0,1.0,No,Yes,Possibly,,No,0.0,I don't know,I don't know,Yes,Yes,100-500,1.0,"Yes, I experienced","Yes, I experienced",27.0,Female,United Kingdom,,2018-05-16 12:32:04,2018-05-16 12:42:40
1,1.0,Yes,Yes,Possibly,,No,0.0,I don't know,I don't know,Maybe,Yes,100-500,2.0,"Yes, I observed",Maybe/Not sure,31.0,male,United Kingdom,,2018-05-16 12:31:13,2018-05-16 12:40:40
2,1.0,I don't know,No,Yes,Yes,Yes,1.0,Yes,Difficult,Yes,Maybe,6-25,1.0,"Yes, I experienced","Yes, I experienced",36.0,male,United States of America,White,2018-05-09 05:34:05,2018-05-09 05:46:04
3,1.0,Yes,Yes,Yes,Yes,I don't know,1.0,Yes,Difficult,Yes,Yes,More than 1000,2.0,Maybe/Not sure,Maybe/Not sure,22.0,Male,United States of America,White,2018-05-04 23:19:14,2018-05-04 23:23:23
4,,,,No,,Yes,,,,,,,1.0,No,"Yes, I observed",52.0,female,United States of America,More than one of the above,2018-05-03 00:40:24,2018-05-03 00:53:20
5,1.0,Yes,No,No,,Yes,0.0,Yes,Somewhat easy,Maybe,Maybe,100-500,2.0,"Yes, I observed","Yes, I observed",30.0,male,United States of America,White,2018-05-01 22:53:02,2018-05-01 22:59:21
6,1.0,Yes,Yes,Yes,Yes,Yes,0.0,Yes,Very easy,Yes,No,6-25,2.0,No,"Yes, I observed",36.0,F,United States of America,Asian,2018-04-28 20:02:22,2018-04-28 20:12:23
7,1.0,Yes,No,No,,Yes,0.0,I don't know,Somewhat easy,Yes,Maybe,26-100,2.0,No,"Yes, I observed",38.0,Female,United States of America,White,2018-04-27 17:42:55,2018-04-27 17:50:41
8,0.0,I don't know,No,Don't Know,,I don't know,0.0,Yes,Very easy,Maybe,Maybe,100-500,2.0,No,"Yes, I experienced",35.0,Male,Switzerland,,2018-04-26 22:35:49,2018-04-26 22:46:46
9,,,,Possibly,,No,,,,,,,3.0,"Yes, I experienced","Yes, I experienced",36.0,male,India,,2018-04-25 07:18:35,2018-04-25 07:22:44


### 2018

In [30]:
# Columns kept from the 2018 survey, written exactly as they appear in the raw
# export. Unlike 2017, the benefits question uses a regular space.
columns_2018 = [
    'Is your employer primarily a tech company/organization?',
    'Does your employer provide mental health benefits as part of healthcare coverage?',
    'Do you know the options for mental health care available under your employer-provided health coverage?',
    'Do you currently have a mental health disorder?',
    'Have you ever been diagnosed with a mental health disorder?',
    'Do you have a family history of mental illness?',
    'Have you ever discussed your mental health with your employer?',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?',
    'Would you feel comfortable discussing a mental health issue with your coworkers?',
    'How many employees does your company or organization have?',
    'Overall, how well do you think the tech industry supports employees with mental health issues?',
    '<strong>Have you observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?</strong>',
    '<strong>Have you observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace?</strong>',
    'What is your age?',
    'What is your gender?',
    'What country do you <strong>live</strong> in?',
    'What is your race?',
    'Start Date (UTC)',
    'Submit Date (UTC)',
]

# Selecting with a list returns a new frame holding only these columns, in this order.
df_2018_reduced = df_2018[columns_2018]


In [31]:
# Map each verbose 2018 survey question to the short column name used for the merge.
# The two date columns are not listed here, so they keep their original names.
rename_map_2018 = {
    'Is your employer primarily a tech company/organization?': 'tech company',
    'Does your employer provide mental health benefits as part of healthcare coverage?': 'employer provided healthcare with mental benefits',
    'Do you know the options for mental health care available under your employer-provided health coverage?': 'employer provided mental healthcare awareness',
    'Do you currently have a mental health disorder?': 'current mental health disorder',
    'Have you ever been diagnosed with a mental health disorder?': 'mental health diagnosis',
    'Do you have a family history of mental illness?': 'family history of mental illness',
    'Have you ever discussed your mental health with your employer?': 'discussed personal mental health with employer',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?': 'anonymity protected when using benefits',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?': 'ease of asking for leave',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?': 'comfortable discussing a mental health issue with direct supervisor(s)',
    'Would you feel comfortable discussing a mental health issue with your coworkers?': 'comfortable discussing a mental health issue with coworkers',
    'How many employees does your company or organization have?': 'Number of employees',
    'Overall, how well do you think the tech industry supports employees with mental health issues?': 'how well do you think the tech industry supports employees with mental health issues',
    '<strong>Have you observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?</strong>': 'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
    '<strong>Have you observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace?</strong>': 'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
    'What is your age?': 'Age',
    'What is your gender?': 'Gender',
    'What country do you <strong>live</strong> in?': 'Country of residence',
    'What is your race?': 'Race',
}

df_2018_reduced = df_2018_reduced.rename(columns=rename_map_2018)

### 2019

In [32]:
# Columns kept from the 2019 survey, written exactly as they appear in the raw
# export (this year marks emphasis with *asterisks* instead of <strong> tags).
# NOTE: no date columns are selected here - the original author flagged that 2019
# has no date info and suggested adding a year column and reducing the other
# years' dates to just the year.
columns_2019 = [
    'Is your employer primarily a tech company/organization?',
    'Does your employer provide mental health benefits as part of healthcare coverage?',
    'Do you know the options for mental health care available under your employer-provided health coverage?',
    'Do you *currently* have a mental health disorder?',
    'Have you ever been *diagnosed* with a mental health disorder?',
    'Do you have a family history of mental illness?',
    'Have you ever discussed your mental health with your employer?',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?',
    'Would you feel comfortable discussing a mental health issue with your coworkers?',
    'How many employees does your company or organization have?',
    'Overall, how well do you think the tech industry supports employees with mental health issues?',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?',
    'What is your age?',
    'What is your gender?',
    'What country do you *live* in?',
    'What is your race?',
]

# Selecting with a list returns a new frame holding only these columns, in this order.
df_2019_reduced = df_2019[columns_2019]

In [33]:
# Rename the selected 2019 columns to the short names used for the merge.
#
# The keys must match the 2019 export's own wording, which marks emphasis with
# *asterisks* (see the 2019 column selection), not the plain / <strong> wording
# of the 2017-2018 exports. DataFrame.rename silently skips keys that match no
# column, so using the older wording left five columns (current disorder,
# diagnosis, both "observed or experienced" questions, country) un-renamed.
rename_map_2019 = {
    'Is your employer primarily a tech company/organization?': 'tech company',
    'Does your employer provide mental health benefits as part of healthcare coverage?': 'employer provided healthcare with mental benefits',
    'Do you know the options for mental health care available under your employer-provided health coverage?': 'employer provided mental healthcare awareness',
    'Do you *currently* have a mental health disorder?': 'current mental health disorder',
    'Have you ever been *diagnosed* with a mental health disorder?': 'mental health diagnosis',
    'Do you have a family history of mental illness?': 'family history of mental illness',
    'Have you ever discussed your mental health with your employer?': 'discussed personal mental health with employer',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?': 'anonymity protected when using benefits',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?': 'ease of asking for leave',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?': 'comfortable discussing a mental health issue with direct supervisor(s)',
    'Would you feel comfortable discussing a mental health issue with your coworkers?': 'comfortable discussing a mental health issue with coworkers',
    'How many employees does your company or organization have?': 'Number of employees',
    'Overall, how well do you think the tech industry supports employees with mental health issues?': 'how well do you think the tech industry supports employees with mental health issues',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?': 'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?': 'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
    'What is your age?': 'Age',
    'What is your gender?': 'Gender',
    'What country do you *live* in?': 'Country of residence',
    'What is your race?': 'Race',
}

df_2019_reduced = df_2019_reduced.rename(columns=rename_map_2019)

# Guard against the silent-skip failure mode: every harmonized name must now exist.
# (Extra columns are allowed, so this still passes if the cell is re-run later.)
missing_2019 = sorted(set(rename_map_2019.values()) - set(df_2019_reduced.columns))
assert not missing_2019, f"2019 columns were not renamed: {missing_2019}"

### 2020

In [34]:
# Columns kept from the 2020 survey, written exactly as they appear in the raw
# export (emphasis is marked with *asterisks*; no date columns are selected).
columns_2020 = [
    'Is your employer primarily a tech company/organization?',
    'Does your employer provide mental health benefits as part of healthcare coverage?',
    'Do you know the options for mental health care available under your employer-provided health coverage?',
    'Do you *currently* have a mental health disorder?',
    'Have you ever been *diagnosed* with a mental health disorder?',
    'Do you have a family history of mental illness?',
    'Have you ever discussed your mental health with your employer?',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?',
    'Would you feel comfortable discussing a mental health issue with your coworkers?',
    'How many employees does your company or organization have?',
    'Overall, how well do you think the tech industry supports employees with mental health issues?',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?',
    'What is your age?',
    'What is your gender?',
    'What country do you *live* in?',
    'What is your race?',
]

# Selecting with a list returns a new frame holding only these columns, in this order.
df_2020_reduced = df_2020[columns_2020]

In [35]:
# Map each verbose 2020 survey question (asterisk-emphasis wording) to the
# short column name used for the merge.
rename_map_2020 = {
    'Is your employer primarily a tech company/organization?': 'tech company',
    'Does your employer provide mental health benefits as part of healthcare coverage?': 'employer provided healthcare with mental benefits',
    'Do you know the options for mental health care available under your employer-provided health coverage?': 'employer provided mental healthcare awareness',
    'Do you *currently* have a mental health disorder?': 'current mental health disorder',
    'Have you ever been *diagnosed* with a mental health disorder?': 'mental health diagnosis',
    'Do you have a family history of mental illness?': 'family history of mental illness',
    'Have you ever discussed your mental health with your employer?': 'discussed personal mental health with employer',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?': 'anonymity protected when using benefits',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?': 'ease of asking for leave',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?': 'comfortable discussing a mental health issue with direct supervisor(s)',
    'Would you feel comfortable discussing a mental health issue with your coworkers?': 'comfortable discussing a mental health issue with coworkers',
    'How many employees does your company or organization have?': 'Number of employees',
    'Overall, how well do you think the tech industry supports employees with mental health issues?': 'how well do you think the tech industry supports employees with mental health issues',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?': 'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?': 'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
    'What is your age?': 'Age',
    'What is your gender?': 'Gender',
    'What country do you *live* in?': 'Country of residence',
    'What is your race?': 'Race',
}

df_2020_reduced = df_2020_reduced.rename(columns=rename_map_2020)

### 2021

In [36]:
# Columns kept from the 2021 survey, written exactly as they appear in the raw
# export (emphasis is marked with *asterisks*; no date columns are selected).
columns_2021 = [
    'Is your employer primarily a tech company/organization?',
    'Does your employer provide mental health benefits as part of healthcare coverage?',
    'Do you know the options for mental health care available under your employer-provided health coverage?',
    'Do you *currently* have a mental health disorder?',
    'Have you ever been *diagnosed* with a mental health disorder?',
    'Do you have a family history of mental illness?',
    'Have you ever discussed your mental health with your employer?',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?',
    'Would you feel comfortable discussing a mental health issue with your coworkers?',
    'How many employees does your company or organization have?',
    'Overall, how well do you think the tech industry supports employees with mental health issues?',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?',
    'What is your age?',
    'What is your gender?',
    'What country do you *live* in?',
    'What is your race?',
]

# Selecting with a list returns a new frame holding only these columns, in this order.
df_2021_reduced = df_2021[columns_2021]

In [37]:
# Map each verbose 2021 survey question to the short column label that appears
# in the merged frame. `rename` skips keys that are not present, so running
# this cell a second time leaves the frame unchanged.
rename_map_2021 = {
    'Is your employer primarily a tech company/organization?':
        'tech company',
    'Does your employer provide mental health benefits as part of healthcare coverage?':
        'employer provided healthcare with mental benefits',
    'Do you know the options for mental health care available under your employer-provided health coverage?':
        'employer provided mental healthcare awareness',
    'Do you *currently* have a mental health disorder?':
        'current mental health disorder',
    'Have you ever been *diagnosed* with a mental health disorder?':
        'mental health diagnosis',
    'Do you have a family history of mental illness?':
        'family history of mental illness',
    'Have you ever discussed your mental health with your employer?':
        'discussed personal mental health with employer',
    'Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?':
        'anonymity protected when using benefits',
    'If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?':
        'ease of asking for leave',
    'Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?':
        'comfortable discussing a mental health issue with direct supervisor(s)',
    'Would you feel comfortable discussing a mental health issue with your coworkers?':
        'comfortable discussing a mental health issue with coworkers',
    'How many employees does your company or organization have?':
        'Number of employees',
    'Overall, how well do you think the tech industry supports employees with mental health issues?':
        'how well do you think the tech industry supports employees with mental health issues',
    'Have you observed or experienced an *unsupportive or badly handled response* to a mental health issue in your current or previous workplace?':
        'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
    'Have you observed or experienced a *supportive or well handled response* to a mental health issue in your current or previous workplace?':
        'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
    'What is your age?':
        'Age',
    'What is your gender?':
        'Gender',
    'What country do you *live* in?':
        'Country of residence',
    'What is your race?':
        'Race',
}

df_2021_reduced = df_2021_reduced.rename(columns=rename_map_2021)

In [38]:
# Stack the yearly frames row-wise into one table.
#
# The earlier chained `merge(how='outer')` had no `on=`, so pandas joined on
# every column the two frames shared. Rows from different years whose answers
# coincided on those columns could be fused into one row (or cross-multiplied
# when duplicated), and the result was re-sorted by key. `pd.concat` keeps
# exactly one output row per input row, in input order, and fills columns a
# given year lacks with NaN.
#
# TODO: 2019 is still missing - its column renaming may need to change (19 columns).
yearly_frames = [df_2017_reduced, df_2018_reduced, df_2020_reduced, df_2021_reduced]
merged_df = pd.concat(yearly_frames, ignore_index=True, sort=False)

# Every respondent row from every included year must survive the stacking.
assert len(merged_df) == sum(len(frame) for frame in yearly_frames)

In [39]:
# Show the merged frame's column labels, in order, as a plain Python list.
list(merged_df.columns)

['tech company',
 'employer provided healthcare with mental benefits',
 'employer provided mental healthcare awareness',
 'current mental health disorder',
 'mental health diagnosis',
 'family history of mental illness',
 'discussed personal mental health with employer',
 'anonymity protected when using benefits',
 'ease of asking for leave',
 'comfortable discussing a mental health issue with direct supervisor(s)',
 'comfortable discussing a mental health issue with coworkers',
 'Number of employees',
 'how well do you think the tech industry supports employees with mental health issues',
 'observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?',
 'observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace',
 'Age',
 'Gender',
 'Country of residence',
 'Race',
 'Start Date (UTC)',
 'Submit Date (UTC)']

In [40]:
# Write the merged frame to a CSV (path is relative to the current working
# directory); the row index is left out of the file.
csv_file_path = "OSMI_clean.csv"
merged_df.to_csv(path_or_buf=csv_file_path, index=False)