In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
import seaborn as sns



from PIL import Image
from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator

## Loading Data

In [2]:
survey = pd.read_csv("survey.csv")

In [3]:
survey.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 173 entries, 0 to 172
Data columns (total 37 columns):
 #   Column                                                                                                                                                          Non-Null Count  Dtype  
---  ------                                                                                                                                                          --------------  -----  
 0   Respondent ID                                                                                                                                                   173 non-null    int64  
 1   Collector ID                                                                                                                                                    173 non-null    int64  
 2   Start Date                                                                                                                            

## CLEANING DATA

In [4]:
# In person ID > 5 
survey["IP Address"].value_counts()

209.52.88.251      8
208.98.223.72      7
137.82.216.1       5
24.114.37.253      5
173.180.3.1        4
                  ..
24.86.237.205      1
184.151.230.21     1
50.64.41.156       1
216.180.68.136     1
184.151.230.115    1
Name: IP Address, Length: 133, dtype: int64

In [5]:
# Brand awareness
survey["Have you heard of the Marine Mammal Rescue Centre (MMR)?"].value_counts(normalize = True)

Yes    0.672515
No     0.327485
Name: Have you heard of the Marine Mammal Rescue Centre (MMR)?, dtype: float64

In [6]:
# 173 respondents
survey.shape

(173, 37)

In [7]:
# 2 respondents didn't answer the first question, and neither the following question. I'm going to delete those 2 rows.
survey[survey["Have you heard of the Marine Mammal Rescue Centre (MMR)?"].isna()]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
164,11374766669,254782488,02/26/2020 04:35:00 PM,02/26/2020 04:37:43 PM,24.244.23.115,,,,,,...,,,,,,,,,,
165,11374216484,254707048,02/26/2020 01:05:32 PM,02/26/2020 02:29:16 PM,137.82.216.1,,,,,,...,,,,,,High-school diploma,,,,


In [8]:
survey = survey.drop(survey.index[165])

In [9]:
survey = survey.drop(survey.index[164])

In [10]:
survey[survey["Have you heard of the Marine Mammal Rescue Centre (MMR)?"].isna()]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"


In [11]:
#171 respondents total
survey.shape

(171, 37)

In [12]:
# 32 respondents didn't answer on average 14 questions in the survey. 
survey[survey["Have you donated to a charity in the past year?"].isna()].iloc[:,13:32]

Unnamed: 0,"Don’t do anything, let nature take its course","Call MMR, the Vancouver Aquarium, or a local rehabilitation centre",Take it home and care for it,Keep people and pets away,Take the mammal to the nearest veterinary clinic,Have you donated to a charity in the past year?,What type of charity/cause have you most frequently donated to in the past year?,Other (please specify).1,Can you share why you donated to that specific charity/cause?,How did you find out about that specific charity/cause?,Other (please specify).2,How do you prefer to make your donations?,Other (please specify).3,Have you considered donating money to the Marine Mammal Rescue Center?,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?
10,,,,,,,,,,,,,,,,,,,
14,,,,,,,,,,,,,,,,,,,
30,,,,,,,,,,,,,,,,,,,
31,,,,,,,,,,,,,,,,,,,
32,2.0,3.0,4.0,5.0,6.0,,,,,,,,,,,,,,
40,,,,,,,,,,,,,,,,,,,
53,,,,,,,,,,,,,,,,,,,
54,,,,,,,,,,,,,,,,,,,
56,,,,,,,,,,,,,,,,,,,
74,,,,,,,Health,,,,,,,,,,,,


In [13]:
survey[survey["Have you donated to a charity in the past year?"].isna()]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
10,11387067669,254782488,03/02/2020 07:23:08 PM,03/02/2020 07:23:18 PM,64.180.214.58,No,,,,,...,,,,,,,,,,
14,11386826316,254782488,03/02/2020 05:02:50 PM,03/02/2020 05:03:29 PM,24.244.23.81,Yes,Friend,,Positive,,...,,,,,,,,,,
30,11385610751,254782488,03/02/2020 09:03:43 AM,03/02/2020 09:04:53 AM,24.69.120.202,Yes,News,,Positive,Very supportive of wildlife rescue efforts,...,,,,,,,,,,
31,11385596165,254782488,03/02/2020 08:59:02 AM,03/02/2020 08:59:36 AM,198.202.137.28,No,,,,,...,,,,,,,,,,
32,11385574724,254782488,03/02/2020 08:52:29 AM,03/02/2020 09:36:06 AM,24.87.190.131,Yes,News,,Positive,I believe in the help for animals in need.,...,,,,,,,,,,
40,11384134997,254782488,03/01/2020 07:15:57 PM,03/01/2020 07:16:36 PM,173.180.128.162,Yes,Vancouver Aquarium,,,,...,,,,,,,,,,
53,11383782807,254782488,03/01/2020 02:28:45 PM,03/01/2020 02:28:59 PM,47.156.169.224,No,,,,,...,,,,,,,,,,
54,11383760369,254782488,03/01/2020 02:08:12 PM,03/01/2020 02:08:28 PM,70.71.240.197,No,,,,,...,,,,,,,,,,
56,11383653016,254782488,03/01/2020 12:25:02 PM,03/01/2020 12:25:39 PM,142.179.72.92,Yes,Vancouver Aquarium,,Positive,,...,,,,,,,,,,
74,11382910639,254782488,02/29/2020 10:16:03 PM,02/29/2020 10:20:23 PM,207.6.51.227,Yes,,family member,Positive,It's important to rescue and rehabilitate mamm...,...,,,,,,,Yes,,,


In [14]:
survey["Have you donated to a charity in the past year?"].fillna("Haven't answered it", inplace = True)

In [15]:
survey[survey["Have you donated to a charity in the past year?"] == "Haven't answered it"]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
10,11387067669,254782488,03/02/2020 07:23:08 PM,03/02/2020 07:23:18 PM,64.180.214.58,No,,,,,...,,,,,,,,,,
14,11386826316,254782488,03/02/2020 05:02:50 PM,03/02/2020 05:03:29 PM,24.244.23.81,Yes,Friend,,Positive,,...,,,,,,,,,,
30,11385610751,254782488,03/02/2020 09:03:43 AM,03/02/2020 09:04:53 AM,24.69.120.202,Yes,News,,Positive,Very supportive of wildlife rescue efforts,...,,,,,,,,,,
31,11385596165,254782488,03/02/2020 08:59:02 AM,03/02/2020 08:59:36 AM,198.202.137.28,No,,,,,...,,,,,,,,,,
32,11385574724,254782488,03/02/2020 08:52:29 AM,03/02/2020 09:36:06 AM,24.87.190.131,Yes,News,,Positive,I believe in the help for animals in need.,...,,,,,,,,,,
40,11384134997,254782488,03/01/2020 07:15:57 PM,03/01/2020 07:16:36 PM,173.180.128.162,Yes,Vancouver Aquarium,,,,...,,,,,,,,,,
53,11383782807,254782488,03/01/2020 02:28:45 PM,03/01/2020 02:28:59 PM,47.156.169.224,No,,,,,...,,,,,,,,,,
54,11383760369,254782488,03/01/2020 02:08:12 PM,03/01/2020 02:08:28 PM,70.71.240.197,No,,,,,...,,,,,,,,,,
56,11383653016,254782488,03/01/2020 12:25:02 PM,03/01/2020 12:25:39 PM,142.179.72.92,Yes,Vancouver Aquarium,,Positive,,...,,,,,,,,,,
74,11382910639,254782488,02/29/2020 10:16:03 PM,02/29/2020 10:20:23 PM,207.6.51.227,Yes,,family member,Positive,It's important to rescue and rehabilitate mamm...,...,,,,,,,Yes,,,


In [16]:
remove_list = ["Haven't answered it"]
survey_v1 = survey[~survey["Have you donated to a charity in the past year?"].isin(remove_list)]


In [17]:
survey_v1.shape

(139, 37)

In [18]:
survey_v1.isna().sum()

Respondent ID                                                                                                                                                       0
Collector ID                                                                                                                                                        0
Start Date                                                                                                                                                          0
End Date                                                                                                                                                            0
IP Address                                                                                                                                                          0
Have you heard of the Marine Mammal Rescue Centre (MMR)?                                                                                                            0
How 

In [19]:
survey_v1.head(7)

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
0,11392865280,254782488,03/04/2020 02:02:23 PM,03/04/2020 02:08:09 PM,70.78.136.94,Yes,Vancouver Aquarium,,Positive,I am a great supporter of the Van Aquarium and...,...,Yes,Abbotsford,British Columbia,Canada,50-64,Bachelor’s degree,No,Donor,,
1,11391985875,254782488,03/04/2020 09:23:12 AM,03/04/2020 09:28:37 AM,174.7.248.66,Yes,Vancouver Aquarium,,Positive,It helps numerous marine mammals every year wh...,...,Yes,Vancouver,BC,Canada,50-64,Master’s or doctoral degree,Yes,Volunteer,,laura.childerson@gmail.com
2,11390176092,254782488,03/03/2020 07:09:15 PM,03/03/2020 07:14:38 PM,70.79.224.29,Yes,Vancouver Aquarium,,Positive,MMR does good work rehabilitating animals,...,Yes,Richmond,BC,Canada,50-64,Master’s or doctoral degree,No,Volunteer,,
3,11389898511,254782488,03/03/2020 04:45:10 PM,03/03/2020 04:58:49 PM,165.225.38.23,Yes,News,,Positive,They do good work,...,No,Langley,British Columbia,Canada,50-64,Bachelor’s degree,No,No affiliation,,
4,11389156335,254782488,03/03/2020 12:07:26 PM,03/03/2020 12:10:40 PM,172.255.50.186,No,,,,,...,Need to know more,Delta,British Columbia,Canada,25-34,Bachelor’s degree,No,No affiliation,,stephen_lee_94@hotmail.com
5,11388596474,254782488,03/03/2020 09:02:53 AM,03/03/2020 09:06:59 AM,72.143.223.66,No,,,,,...,No,Vancouver,BC,Canada,25-34,Bachelor’s degree,No,No affiliation,,
6,11388537401,254782488,03/03/2020 08:44:18 AM,03/03/2020 08:48:24 AM,24.114.44.255,No,,,,,...,Yes,Coquitlam,BC,Canada,25-34,Master’s or doctoral degree,No,No affiliation,,


In [20]:
survey_v1.loc[survey_v1["Have you heard of the Marine Mammal Rescue Centre (MMR)?"] == "No"].iloc[:,5:11]
 

Unnamed: 0,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,Please describe what a marine mammal in distress looks like to you?
4,No,,,,,Escaping the water due to toxic conditions (po...
5,No,,,,,Not sure
6,No,,,,,"caught in nets, stomach full of plastic, sound..."
7,No,,,,,A mammal kept in inappropriate living conditio...
8,No,,,,,"Obvious physical trauma, swimming frantically,..."
9,No,,,,,A whale or dolphin eating plastic
11,No,,,,,"Mammal caught in fish net, or plastics. Mammal..."
12,No,,,,,
19,No,,,,,Being tangled in garbage (e.g. plastics) and s...
22,No,,,,,"Eyes look tired, movement and mannerisms do no..."


In [21]:
mask = (survey_v1['Have you heard of the Marine Mammal Rescue Centre (MMR)?']=="No")
mean = "Haven't heard of it"
survey_v1.loc[mask, 'Other (please specify)'] = survey_v1.loc[mask, 'Other (please specify)'].fillna(mean)



A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self.obj[item] = s


In [22]:
col_list = ["How did you hear about the MMR?",
            "Other (please specify)",
            "On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",
            "Please explain why you chose your selected ranking?"]

In [23]:
for col in col_list:
    mask = (survey_v1['Have you heard of the Marine Mammal Rescue Centre (MMR)?']=="No")
    mean = "Haven't heard of it"
    survey_v1.loc[mask, col] = survey_v1.loc[mask, col].fillna(mean)
    

In [24]:
survey_v1[survey_v1["How did you hear about the MMR?"].isna()]
survey_v1["How did you hear about the MMR?"].fillna("Didn't answered it", inplace = True)



A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self._update_inplace(new_data)


In [25]:
survey_v1[survey_v1["Other (please specify)"].isna()]
survey_v1["Other (please specify)"].fillna("Answered in the previous question",inplace = True)

In [26]:
survey["Other (please specify)"].unique()

array([nan, 'Bamfield marine science center ', 'Daughter',
       'family member', 'I am a volunteer there.'], dtype=object)

In [27]:
survey_v1[survey_v1["On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?"].isna()]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
15,11386695569,254782488,03/02/2020 03:59:23 PM,03/02/2020 04:06:34 PM,72.143.216.198,Yes,Didn't answered it,Bamfield marine science center,,"I’ve heard of it, I don’t know anything about it.",...,Yes,Port Moody,BC,Can,35-49,Bachelor’s degree,No,No affiliation,,Ryanlucier1@gmail.com


In [28]:
survey_v1["On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?"].fillna("Didn't answer it", inplace = True)

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self._update_inplace(new_data)


In [29]:
survey_v1[survey_v1["Please explain why you chose your selected ranking?"].isna()]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,Have you considered donating money to ocean health and conservation causes?,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:"
25,11385710715,254782488,03/02/2020 09:36:34 AM,03/02/2020 09:43:59 AM,24.87.190.131,Yes,News,Answered in the previous question,Positive,,...,No,MR,BC,CANADA,65+,,,,,
36,11384350062,254782488,03/01/2020 10:56:03 PM,03/01/2020 10:58:54 PM,184.71.165.190,Yes,Friend,Answered in the previous question,Neutral,,...,No,Victoria,British columbia,Canada,35-49,Master’s or doctoral degree,No,Member,,
44,11383972225,254782488,03/01/2020 05:07:47 PM,03/01/2020 05:11:58 PM,70.71.116.174,Yes,Friend,Answered in the previous question,Somewhat Positive,,...,No,,,,50-64,,No,No affiliation,,
57,11383544387,254782488,03/01/2020 10:36:21 AM,03/01/2020 10:41:33 AM,66.183.73.135,Yes,Vancouver Aquarium,Answered in the previous question,Positive,,...,Yes,Vancouver,BC,Canada,65+,,Yes,Volunteer,,
99,11382746808,254782488,02/29/2020 06:35:14 PM,02/29/2020 06:40:59 PM,99.199.18.52,Yes,Social media,Answered in the previous question,Positive,,...,Yes,North Vancouver,British Columbia,Canada,Under 25,College or CEGEP diploma,No,Volunteer,,
132,11382485059,254782488,02/29/2020 01:33:41 PM,02/29/2020 01:38:53 PM,24.114.43.253,Yes,Vancouver Aquarium,Answered in the previous question,Positive,,...,No,Vancouver,Bc,Canada,50-64,College or CEGEP diploma,No,,Past volunteer,Vangal727@gmail.com
142,11382455627,254782488,02/29/2020 12:48:13 PM,02/29/2020 01:07:29 PM,24.114.25.201,Yes,Vancouver Aquarium,Answered in the previous question,Somewhat Positive,,...,No,Surrey,Bc,Can,25-34,Bachelor’s degree,No,Member,,Sunweipop@gmail.com


In [30]:
survey_v1["Please explain why you chose your selected ranking?"].fillna("Didn't answer it", inplace = True)

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self._update_inplace(new_data)


In [31]:
# filling 0 where they haven't ranked the options
columns_list = ['Please state what actions you would take if you came across a marine mammal in distress. (Rank your choices with 1 being the best).  Feed the mammal shellfish',
       'Don’t do anything, let nature take its course',
       'Call MMR, the Vancouver Aquarium, or a local rehabilitation centre',
       'Take it home and care for it', 'Keep people and pets away',
       'Take the mammal to the nearest veterinary clinic']

for col in columns_list:
    survey_v1[col].fillna(0,inplace = True)

In [32]:
columns_survey = survey_v1.columns

In [33]:
for col in columns_survey:
    survey_v1[col].fillna("Didn't answer it",inplace = True)

In [34]:
survey_v1.isna().sum()

Respondent ID                                                                                                                                                     0
Collector ID                                                                                                                                                      0
Start Date                                                                                                                                                        0
End Date                                                                                                                                                          0
IP Address                                                                                                                                                        0
Have you heard of the Marine Mammal Rescue Centre (MMR)?                                                                                                          0
How did you hear

In [35]:
# For better analysis, we are going to divide the respondents into 2 clusters
# 0 for no affiliation
# 1 for affiliated with Vancouver Aquarium 

In [36]:
survey_v1["Do you have an affiliation to the Vancouver Aquarium?"].unique()

array(['Donor', 'Volunteer', 'No affiliation', "Didn't answer it",
       'Member', 'Staff'], dtype=object)

In [37]:
affiliation = ['Donor', 'Volunteer',
       'Member', 'Staff']
clusters = []

for answer in survey_v1["Do you have an affiliation to the Vancouver Aquarium?"]:
    if answer in affiliation:
        clusters.append(1)
        
    else:
        clusters.append(0)
    

In [38]:
len(clusters)

139

In [39]:
survey_v1.shape

(139, 37)

In [40]:
survey_v1["clusters"] = clusters

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  """Entry point for launching an IPython kernel.


In [41]:
survey_v1.head()

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:",clusters
0,11392865280,254782488,03/04/2020 02:02:23 PM,03/04/2020 02:08:09 PM,70.78.136.94,Yes,Vancouver Aquarium,Answered in the previous question,Positive,I am a great supporter of the Van Aquarium and...,...,Abbotsford,British Columbia,Canada,50-64,Bachelor’s degree,No,Donor,Didn't answer it,Didn't answer it,1
1,11391985875,254782488,03/04/2020 09:23:12 AM,03/04/2020 09:28:37 AM,174.7.248.66,Yes,Vancouver Aquarium,Answered in the previous question,Positive,It helps numerous marine mammals every year wh...,...,Vancouver,BC,Canada,50-64,Master’s or doctoral degree,Yes,Volunteer,Didn't answer it,laura.childerson@gmail.com,1
2,11390176092,254782488,03/03/2020 07:09:15 PM,03/03/2020 07:14:38 PM,70.79.224.29,Yes,Vancouver Aquarium,Answered in the previous question,Positive,MMR does good work rehabilitating animals,...,Richmond,BC,Canada,50-64,Master’s or doctoral degree,No,Volunteer,Didn't answer it,Didn't answer it,1
3,11389898511,254782488,03/03/2020 04:45:10 PM,03/03/2020 04:58:49 PM,165.225.38.23,Yes,News,Answered in the previous question,Positive,They do good work,...,Langley,British Columbia,Canada,50-64,Bachelor’s degree,No,No affiliation,Didn't answer it,Didn't answer it,0
4,11389156335,254782488,03/03/2020 12:07:26 PM,03/03/2020 12:10:40 PM,172.255.50.186,No,Haven't heard of it,Haven't heard of it,Haven't heard of it,Haven't heard of it,...,Delta,British Columbia,Canada,25-34,Bachelor’s degree,No,No affiliation,Didn't answer it,stephen_lee_94@hotmail.com,0


In [42]:
survey_v1[survey_v1["Do you have an affiliation to MMR?"] == "Didn't answer it"]

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:",clusters
25,11385710715,254782488,03/02/2020 09:36:34 AM,03/02/2020 09:43:59 AM,24.87.190.131,Yes,News,Answered in the previous question,Positive,Didn't answer it,...,MR,BC,CANADA,65+,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,0
168,11372013645,254715558,02/25/2020 10:09:29 PM,02/25/2020 10:10:07 PM,96.49.200.74,No,Haven't heard of it,Haven't heard of it,Haven't heard of it,Haven't heard of it,...,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,0


In [43]:
survey_v1[survey_v1["Do you have an affiliation to the Vancouver Aquarium?"] == "Didn't answer it"]
# a few respondents were past volunteers or members and I will add them to the cluster 1

Unnamed: 0,Respondent ID,Collector ID,Start Date,End Date,IP Address,Have you heard of the Marine Mammal Rescue Centre (MMR)?,How did you hear about the MMR?,Other (please specify),"On a scale of 1-5 with 1 being negative and 5 being positive, how do you feel about the Marine Mammal Rescue Centre’s services?",Please explain why you chose your selected ranking?,...,City/Town,State/Province,Country,What is your age?,What is the highest level of education achieved?,Do you have an affiliation to MMR?,Do you have an affiliation to the Vancouver Aquarium?,Other (please specify).4,"If you would like to be entered into a random draw for two general admission passes to the Vancouver Aquarium, please share your email address:",clusters
16,11386669614,254782488,03/02/2020 03:46:19 PM,03/02/2020 03:51:32 PM,137.82.216.1,Yes,Vancouver Aquarium,Answered in the previous question,Positive,They help animals in need. If they didn't res...,...,Richmond,BC - British Columbia,Canada,50-64,Bachelor’s degree,No,Didn't answer it,Past member,leanne.bernaerdt@ubc.ca,0
20,11386000418,254782488,03/02/2020 11:18:05 AM,03/02/2020 11:30:30 AM,137.82.216.1,Yes,Affiliated organization,Answered in the previous question,Somewhat Positive,I have confidence that MMR does good work and ...,...,Vancouver,BC,Canada,35-49,Bachelor’s degree,No,Didn't answer it,Customer,Didn't answer it,0
25,11385710715,254782488,03/02/2020 09:36:34 AM,03/02/2020 09:43:59 AM,24.87.190.131,Yes,News,Answered in the previous question,Positive,Didn't answer it,...,MR,BC,CANADA,65+,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,0
73,11382910710,254782488,02/29/2020 10:16:19 PM,02/29/2020 10:21:50 PM,174.7.107.208,Yes,Vancouver Aquarium,Answered in the previous question,Positive,Taking of animals in need is what humans have ...,...,Vancouver,Bc,Canada,50-64,Bachelor’s degree,Yes,Didn't answer it,Past volunteer,Piadewdney@gmail.com,0
132,11382485059,254782488,02/29/2020 01:33:41 PM,02/29/2020 01:38:53 PM,24.114.43.253,Yes,Vancouver Aquarium,Answered in the previous question,Positive,Didn't answer it,...,Vancouver,Bc,Canada,50-64,College or CEGEP diploma,No,Didn't answer it,Past volunteer,Vangal727@gmail.com,0
168,11372013645,254715558,02/25/2020 10:09:29 PM,02/25/2020 10:10:07 PM,96.49.200.74,No,Haven't heard of it,Haven't heard of it,Haven't heard of it,Haven't heard of it,...,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,Didn't answer it,0


In [44]:
survey_v1.loc[survey_v1["Other (please specify).4"] == "Past member", 'clusters'] = 1





A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self.obj[item] = s


In [45]:
survey_v1.loc[survey_v1["Other (please specify).4"] == 'Member and volunteer.', 'clusters'] = 1

In [46]:
survey_v1.loc[survey_v1["Other (please specify).4"] == "Past volunteer ", 'clusters'] = 1

In [48]:
#survey_v1.to_csv("survey_v2.csv")