In [35]:
# Dependencies/Libraries
%matplotlib notebook
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
!pip install vaderSentiment
import vaderSentiment



In [36]:
# Store filepath in a variable

file = "../KasiaProject/suicide_gender_data.csv"


In [37]:
# Loading a .csv file into a pandas DataFrame

file_df = pd.read_csv(file, encoding="ISO-8859-1")


In [38]:
# Show just the header (first 5 rows)
file_df.head()


Unnamed: 0,Year,Male,Female
0,1950,21.2,5.6
1,1960,20.0,5.6
2,1970,19.8,7.4
3,1980,19.9,5.7
4,1990,21.5,4.8


In [39]:
# Sorting by Year
file_df.sort_values(by='Year', ascending=False)


Unnamed: 0,Year,Male,Female
22,2016,21.4,6.0
21,2015,21.1,6.0
20,2014,20.7,5.8
19,2013,20.3,5.5
18,2012,20.4,5.4
17,2011,20.0,5.2
16,2010,19.8,5.0
15,2009,19.2,4.9
14,2008,19.0,4.8
13,2007,18.5,4.6


In [40]:
# Finding suicide average for males

male_mean_df = file_df["Male"].mean()

male_mean_df


19.56086956521739

In [41]:
# Finding suicide average for females

female_mean_df = file_df["Female"].mean()

female_mean_df


5.073913043478262

In [42]:
# Get current axis (ax allows reuse an axis to plot multiple lines)
ax = plt.gca() 

file_df.plot(kind='line', x='Year', y='Female', color='purple', ax=ax, linestyle='solid', linewidth=1.5, fontsize=8.5, figsize=(8,4))
file_df.plot(kind='line', x='Year', y='Male', color='red', linewidth=1.5, ax=ax, linestyle='solid')


# Adding customized grid line
ax.grid(linestyle=':', linewidth='0.5', color='gray')


# Adding Title
plt.title("Suicide Rates in the U.S. 1950-2016 (by gender)", fontname="Arial", fontsize=13)


# Adding Labels
plt.xlabel('Year', fontname="Arial", fontsize=9)
plt.ylabel('Percentage',fontname="Arial", fontsize=9)


# Display the plot
plt.show()


# Save plot as PDF
plt.savefig('suicide_gender.png')




<IPython.core.display.Javascript object>

In [43]:
from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer
analyzer = SentimentIntensityAnalyzer()


In [44]:
# Text to Analyze
suicide_string = "According to various research studies, differences in gender roles and expectations may account for some of the differences in suicidal behavior. The gender stereotype of men being tough and strong does not allow for failure, perhaps causing men to select a more violent and lethal method of suicide; while women, who are allowed, in  social acceptance terms, the option to express weakness and ask for help, may use suicide attempts as means of expressing their desire for assistance."


# Target String Setting
target_string = suicide_string


In [45]:
# Run analysis
results = analyzer.polarity_scores(target_string)
results


{'neg': 0.249, 'neu': 0.613, 'pos': 0.138, 'compound': -0.911}

In [46]:
# Run analysis
compound = results["compound"]


In [47]:
"""The Compound score is a metric that calculates the sum of all the 
lexicon ratings which have been normalized between -1 (most extreme negative) 
and +1 (most extreme positive)"""

# Print Analysis
print(target_string)
print("Compound Score:", compound)



According to various research studies, differences in gender roles and expectations may account for some of the differences in suicidal behavior. The gender stereotype of men being tough and strong does not allow for failure, perhaps causing men to select a more violent and lethal method of suicide; while women, who are allowed, in  social acceptance terms, the option to express weakness and ask for help, may use suicide attempts as means of expressing their desire for assistance.
Compound Score: -0.911
