In [1]:
# import packages

# Basics
import pandas as pd
pd.set_option("display.max_columns", None)
import numpy as np

# Graphs
from matplotlib import pyplot as plt
%matplotlib inline
import seaborn as sns

# Filter warnings
import warnings
warnings.filterwarnings("ignore")

# Preprocessing; model selection and evaluation
from sklearn import pipeline, preprocessing
from sklearn.model_selection import cross_val_score, train_test_split, GridSearchCV
from sklearn.metrics import classification_report

# text handling
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.feature_extraction.text import TfidfVectorizer

# Models
from sklearn.linear_model import LogisticRegression, LinearRegression
from sklearn.ensemble import RandomForestClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.mixture import GaussianMixture
from sklearn.svm import SVC
from xgboost import XGBClassifier
from sklearn.cluster import AgglomerativeClustering, KMeans
from sklearn.neural_network import MLPClassifier
import statsmodels.api as sm

# for custom countvectorizer with SpaCy lemmatization
import spacy
from sklearn.feature_extraction.text import CountVectorizer, HashingVectorizer, VectorizerMixin
from sklearn.base import TransformerMixin, BaseEstimator
from scipy.sparse import csr_matrix

# WordCloud
from os import path
from PIL import Image
from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator
from sklearn.feature_extraction.text import ENGLISH_STOP_WORDS

In [4]:
# Load the cleaned survey labels and drop the "Unnamed: 0" column
# (presumably a leftover index written when the CSV was saved - TODO confirm).
# The drop is chained instead of using inplace=True, so `data` is built in a
# single expression and never exists in a half-cleaned state.
data = pd.read_csv("Datasets/cleaned_labels_df.csv").drop(columns="Unnamed: 0")

# Work on a copy so that `data` stays exactly as loaded.
df = data.copy()

In [5]:
# Preview the first rows of the working copy.
df.head()

Unnamed: 0,id,Are you self-employed?,How many employees does your company or organization have?,Is your employer primarily a tech company/organization?,Is your primary role within your company related to tech/IT?,Does your employer provide mental health benefits as part of healthcare coverage?,Do you know the options for mental health care available under your employer-provided health coverage?,"Has your employer ever formally discussed mental health (for example, as part of a wellness campaign or other official communication)?",Does your employer offer resources to learn more about mental health disorders and options for seeking help?,Is your anonymity protected if you choose to take advantage of mental health or substance abuse treatment resources provided by your employer?,"If a mental health issue prompted you to request a medical leave from work, how easy or difficult would it be to ask for that leave?",Would you feel more comfortable talking to your coworkers about your physical health or your mental health?,Would you feel comfortable discussing a mental health issue with your direct supervisor(s)?,Have you ever discussed your mental health with your employer?,Would you feel comfortable discussing a mental health issue with your coworkers?,Have you ever discussed your mental health with coworkers?,Have you ever had a coworker discuss their or another coworker's mental health with you?,"Overall, how much importance does your employer place on physical health?","Overall, how much importance does your employer place on mental health?",Do you have previous employers?,Was your employer primarily a tech company/organization?,Have your previous employers provided mental health benefits?,Were you aware of the options for mental health care provided by your previous employers?,Did your previous employers ever formally discuss mental health (as part of a wellness campaign or other official communication)?,Did your previous employers provide resources to learn more 
about mental health disorders and how to seek help?,Was your anonymity protected if you chose to take advantage of mental health or substance abuse treatment resources with previous employers?,Would you have felt more comfortable talking to your previous employer about your physical health or your mental health?,Would you have been willing to discuss your mental health with your direct supervisor(s)?,Did you ever discuss your mental health with your previous employer?,Would you have been willing to discuss your mental health with your coworkers at previous employers?,Did you ever discuss your mental health with a previous coworker(s)?,Did you ever have a previous coworker discuss their or another coworker's mental health with you?,"Overall, how much importance did your previous employer place on physical health?","Overall, how much importance did your previous employer place on mental health?",Do you currently have a mental health disorder?,Have you ever been diagnosed with a mental health disorder?,Anxiety Disorder,Mood Disorder,Psychotic Disorder,Eating Disorder,Neurodevelopmental Disorders,Personality Disorder,Obsessive-Compulsive Disorder,Post-Traumatic Stress Disorder,Dissociative Disorder,Substance-Related and Addictive Disorders,Other,Adjustment disorder,Have you had a mental health disorder in the past?,Have you ever sought treatment for a mental health disorder from a mental health professional?,Do you have a family history of mental illness?,"If you have a mental health disorder, how often do you feel that it interferes with your work when being treated effectively?","If you have a mental health disorder, how often do you feel that it interferes with your work when NOT being treated effectively (i.e., when you are experiencing symptoms)?",Have your observations of how another individual who discussed a mental health issue made you less likely to reveal a mental health issue yourself in your current workplace?,How willing would you be to share with friends 
and family that you have a mental illness?,Would you be willing to bring up a physical health issue with a potential employer in an interview?,Why or why not?,Would you bring up your mental health with a potential employer in an interview?,Why or why not?.1,Are you openly identified at work as a person with a mental health issue?,"If they knew you suffered from a mental health disorder, how do you think that team members/co-workers would react?",Have you observed or experienced an unsupportive or badly handled response to a mental health issue in your current or previous workplace?,Have you observed or experienced supportive or well handled response to a mental health issue in your current or previous workplace?,"Overall, how well do you think the tech industry supports employees with mental health issues?",Briefly describe what you think the industry as a whole and/or employers could do to improve mental health support for employees.,What is your age?,What is your gender?,What country do you live in?,What US state or territory do you live in?,What is your race?,Start Date (UTC),Submit Date (UTC),Network ID
0,1,0,100-500,1.0,1.0,No,Yes,No,I don't know,I don't know,I don't know,Same level of comfort for each,Yes,0.0,Yes,1.0,1.0,6.0,0.0,1,0.0,I don't know,N/A (was not aware),Some did,Some did,"Yes, always",Physical health,"Yes, all of my previous supervisors",0.0,"No, at none of my previous employers",0.0,0.0,3.0,3.0,Possibly,Did not answer,1,0,0,0,0,0,0,0,0,0,0,0,Possibly,1,No,Sometimes,Sometimes,No,5,Yes,Did not answer,No,I'd be worried they wouldn't hire me,0.0,10.0,"Yes, I experienced","Yes, I experienced",1.0,They don't take it seriously,27.0,Female,United Kingdom,,Did not answer,2018-05-16 12:32:04,2018-05-16 12:42:40,464b7a12f1
1,2,0,100-500,1.0,1.0,Yes,Yes,No,No,I don't know,I don't know,Same level of comfort for each,Maybe,0.0,Yes,1.0,1.0,7.0,2.0,1,1.0,Some did,I was aware of some,None did,None did,I don't know,Physical health,"No, none of my previous supervisors",0.0,Some of my previous employers,1.0,0.0,5.0,2.0,Possibly,Did not answer,0,1,0,0,0,0,0,0,0,0,0,0,Possibly,0,No,Not applicable to me,Sometimes,No,4,Yes,it may require specific measures to accomodate...,No,mental health issues are stigmatised and misun...,0.0,6.0,"Yes, I observed",Maybe/Not sure,2.0,"raise awareness, talk about it to lessen the s...",31.0,Male,United Kingdom,,Did not answer,2018-05-16 12:31:13,2018-05-16 12:40:40,464b7a12f1
2,3,0,6-25,1.0,1.0,I don't know,No,I don't know,No,Yes,Difficult,Same level of comfort for each,Yes,1.0,Maybe,1.0,0.0,0.0,1.0,1,1.0,Some did,N/A (was not aware),None did,None did,I don't know,Physical health,"No, none of my previous supervisors",0.0,Some of my previous employers,1.0,0.0,8.0,0.0,Yes,Yes,1,1,0,0,0,0,0,0,0,1,0,0,Yes,1,Yes,Sometimes,Sometimes,Yes,5,Maybe,I will sometimes bring up my psoriasis just as...,No,stigma,1.0,5.0,"Yes, I experienced","Yes, I experienced",1.0,"Education and awareness, statistics, add suppo...",36.0,Male,United States of America,Missouri,Caucasian,2018-05-09 05:34:05,2018-05-09 05:46:04,1eb7e0cb94
3,4,0,More than 1000,1.0,1.0,Yes,Yes,I don't know,I don't know,Yes,Difficult,Same level of comfort for each,Yes,1.0,Yes,1.0,0.0,7.0,5.0,0,-1.0,Did not answer,Did not answer,Did not answer,Did not answer,Did not answer,Did not answer,Did not answer,-1.0,Did not answer,-1.0,-1.0,5.0,5.0,Yes,Yes,0,0,0,0,1,0,0,0,0,0,0,0,No,1,I don't know,Sometimes,Often,No,10,No,Anything that may hurt my chances to be hired ...,No,Might hurt my chances,0.0,5.0,Maybe/Not sure,Maybe/Not sure,2.0,"More support, less burnout and death marches",22.0,Male,United States of America,Washington,Caucasian,2018-05-04 23:19:14,2018-05-04 23:23:23,63852edbc4
4,5,1,0,-1.0,-1.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,Not Applicable,Not Applicable,Not Applicable,Not Applicable,-1.0,Not Applicable,-1.0,-1.0,5.0,5.0,1,0.0,"No, none did",N/A (none offered),None did,None did,"Yes, always",Same level of comfort for each,"No, none of my previous supervisors",0.0,"No, at none of my previous employers",1.0,1.0,8.0,8.0,No,Did not answer,0,0,0,0,0,0,0,0,0,0,0,0,Yes,1,Yes,Often,Sometimes,No,10,Maybe,It depends. it's not something you start with ...,No,Don't think it's connected to the job. You do ...,0.0,4.0,No,"Yes, I observed",1.0,I think tech is more internal and they don't r...,52.0,Female,United States of America,Illinois,Mixed,2018-05-03 00:40:24,2018-05-03 00:53:20,43237889f1
