In [14]:
import os

import pandas as pd

## toplines & visuals
# from pandas_profiling import ProfileReport
import sweetviz as sv

import numpy as np

pd.set_option('display.max_columns', None)
# pd.set_option('display.max_colwidth', None)

## set notebook to 100% width of page
from IPython.core.display import display, HTML
display(HTML("<style>.container { width:100% !important; }</style>"))

# Data

In [15]:
surveys = pd.read_csv('./datasets/dpp/2016-survey-data-kaggle/VOTER_Survey_December16_Release1.csv')
surveys.columns = surveys.columns.str.lower()

q1 = pd.read_csv('../job-apply/interviews/gsg/data/question1_data.csv')

questions = pd.read_csv('../job-apply/interviews/gsg/data/question4_files/questions.csv')
responses = pd.read_csv('../job-apply/interviews/gsg/data/question4_files/responses.csv')
weight_schemes = pd.read_csv('../job-apply/interviews/gsg/data/question4_files/weight_schemes.csv')
respondent_data = pd.read_csv('../job-apply/interviews/gsg/data/question4_files/respondent_data.csv')
respondent_weight = pd.read_csv('../job-apply/interviews/gsg/data/question4_files/respondent_weights.csv')

  exec(code_obj, self.user_global_ns, self.user_ns)


# Toplines

In [7]:
## QUESTION - RESPONSE - FREQUENCY - PERCENTAGE

In [8]:
q_18058 = questions[questions['project_id'] == 18058].sort_values('question_id')
q_18390 = questions[questions['project_id'] == 18390].sort_values('question_id')

r_18058 = responses[responses['project_id'] == 18058].sort_values('question_id')
r_18390 = responses[responses['project_id'] == 18390].sort_values('question_id')

rd_18058 = respondent_data[respondent_data['project_id'] == 18058].sort_values('question_id')
rd_18390 = respondent_data[respondent_data['project_id'] == 18390].sort_values('question_id')

rw_18058 = respondent_weight[respondent_weight['project_id'] == 18058]
rw_18390 = respondent_weight[respondent_weight['project_id'] == 18390]

ws_18058 = weight_schemes[weight_schemes['project_id'] == 18058]
ws_18390 = weight_schemes[weight_schemes['project_id'] == 18390]

In [9]:
## combine questions & response on 'responses'
output_18058 = r_18058.merge(q_18058, how='left', on='question_id')
## remove unneeded cols
output_18058 = output_18058[['question_id', 'response', 
                             'response_index', 'text_y','text_x']]
output_18058.rename(columns={
    'text_y': 'question_text',
    'text_x': 'response_text'
}, inplace=True)

## order the cols by question and respnse
output_18058.sort_values(['question_id', 'response'], inplace=True)

## corr resp_weights to weight scheme marked 'final' in weight_schemes
cond = (ws_18058['name'] == 'Final')
w_id = ws_18058[cond]['weight_scheme_id'].values[0]

rw_18058 = rw_18058[rw_18058['weight_scheme_id'] == w_id]

In [10]:
## weights are tied to individual respondent id's
## For more info/background on weighted tables in survey data, ref'd from source:
    ## https://www.datarevelations.com/working-with-weighted-survey-data/
## perc is the % of overall choice in category/question

## combine the weights corr to respondent, response, and question.
m_weights_18058 = rd_18058.merge(rw_18058, how='left', 
                                 on='respondent_id').sort_values('respondent_id').groupby(['question_id', 
                                                                                           'response'], 
                                                                                           as_index=False).sum()
## merge with questions/respondents data
output_18058 = pd.merge(output_18058, m_weights_18058, how='left', 
                        left_on=['question_id', 'response'],
                        right_on=['question_id', 'response'])

## clean cols, round floats down
output_18058.rename(columns={'weight': 'freq_weight'}, inplace=True)
output_18058['freq_weight'].fillna(0, inplace=True)
output_18058['freq_weight'] = output_18058['freq_weight'].apply(lambda x: np.round(x, 1))

## the meat and potatoes:
cumsum = output_18058.groupby(['question_id']).sum().groupby(level=0).cumsum().reset_index()
output_18058 = output_18058.merge(cumsum, how='left', on='question_id')

output_18058['percent_weighted'] = output_18058['freq_weight_x'] / output_18058['freq_weight_y']

output_18058 = output_18058[['question_id', 'question_text', 'response_text', 
                             'freq_weight_x', 'percent_weighted']].rename(columns={'freq_weight_x': 'freq_weighted'})
output_18058

Unnamed: 0,question_id,question_text,response_text,freq_weighted,percent_weighted
0,A19,Shares your values,Very well,30.8,0.152929
1,A19,Shares your values,Somewhat well,71.4,0.354518
2,A19,Shares your values,Not very well,23.1,0.114697
3,A19,Shares your values,Not well at all,43.4,0.215492
4,A19,Shares your values,(Don't know/Refused),32.7,0.162363
...,...,...,...,...,...
248,V1,"If the election for US Congress was today, for...",John Crichton,125.7,0.311833
249,V1,"If the election for US Congress was today, for...",Lean John Crichton,4.4,0.010915
250,V1,"If the election for US Congress was today, for...",(Undecided/Refused),58.3,0.144629
251,VER,VERSION,A,201.5,0.500000


# Crosstabs, Pivot Tables

In [16]:
print(surveys.shape)
surveys.head()

(8000, 668)


Unnamed: 0,case_identifier,weight,party_agendas_rand_2016,pp_primary16_2016,pp_demprim16_2016,pp_repprim16_2016,inputstate_2016,izip_2016,votereg2_2016,votereg_f_2016,regzip_2016,turnout16_2016,vote_usual_2016,votemeth16_2016,presvote16post_2016,presvote16post_t_2016,vote2016_cand2_2016,vote_for_against_2016,clinton_rubio_2016,clinton_cruz_2016,sanders_trump_2016,sanders_rubio_2016,wished_voted_2016,vote_regrets_2016,second_chance_2016,second_chance_t_2016,accurately_counted_2016,accurately_counted2_2016,obamaapp_2016,fav_trump_2016,fav_cruz_2016,fav_ryan_2016,fav_romn_2016,fav_obama_2016,fav_hrc_2016,fav_sanders_2016,fav_rubio_2016,party_agendas_d1_2016,party_agendas_d2_2016,party_agendas_d3_2016,party_agendas_d4_2016,party_agendas_d5_2016,party_agendas_d6_2016,party_agendas_d7_2016,party_agendas_d8_2016,party_agendas_d9_2016,party_agendas_d10_2016,party_agendas_d11_2016,party_agendas_d12_2016,party_agendas_r1_2016,party_agendas_r2_2016,party_agendas_r3_2016,party_agendas_r4_2016,party_agendas_r5_2016,party_agendas_r6_2016,party_agendas_r7_2016,party_agendas_r8_2016,party_agendas_r9_2016,party_agendas_r10_2016,party_agendas_r11_2016,party_agendas_r12_2016,rigged_system_1_2016,rigged_system_2_2016,rigged_system_3_2016,rigged_system_4_2016,rigged_system_5_2016,rigged_system_6_2016,track_2016,persfinretro_2016,econtrend_2016,americatrend_2016,futuretrend_2016,wealth_2016,values_culture_2016,us_respect_2016,trustgovt_2016,trust_people_2016,helpful_people_2016,fair_people_2016,ft_black_2016,ft_white_2016,ft_hisp_2016,ft_asian_2016,ft_muslim_2016,ft_jew_2016,ft_christ_2016,ft_fem_2016,ft_immig_2016,ft_blm_2016,ft_wallst_2016,ft_gays_2016,ft_unions_2016,ft_police_2016,ft_altright_2016,imiss_a_2016,imiss_b_2016,imiss_c_2016,imiss_d_2016,imiss_e_2016,imiss_f_2016,imiss_g_2016,imiss_h_2016,imiss_i_2016,imiss_j_2016,imiss_k_2016,imiss_l_2016,imiss_m_2016,imiss_n_2016,imiss_o_2016,imiss_p_2016,imiss_q_2016,imiss_r_2016,imiss_s_2016,imiss_t_2016,imiss_u_2016,imiss_x_2016,imiss_y_2016,immi_contribution_2016,immi_naturalize_2016,immi_makedifficult_2016,immi_muslim_2016,abortview3_2016,gaymar_2016,view_transgender_2016,deathpen_2016,deathpenfreq_2016,police_threat_2016,conviction_accuracy_2016,univhealthcov_2016,healthreformbill_2016,envwarm_2016,envpoll2_2016,affirmact_gen_2016,taxdoug_2016,govt_reg_2016,gvmt_involment_2016,tradepolicy_2016,free_trade_1_2016,free_trade_2_2016,free_trade_3_2016,free_trade_4_2016,free_trade_5_2016,amcitizen_2016,amshamed_2016,belikeus_2016,prouddem_2016,proudhis_2016,proudgrp_2016,ambornin_2016,amcit_2016,amlived_2016,amenglish_2016,amchrstn_2016,amgovt_2016,amwhite_2016,amdiverse_2016,sexism1_2016,sexism2_2016,sexism3_2016,sexism4_2016,sexism5_2016,sexism6_2016,gender_equality_2016,race_deservemore_2016,race_overcome_2016,race_tryharder_2016,race_slave_2016,policies_favor_2016,reverse_discrimination_2016,inc_opp_blacks_2016,race_majority_1_2016,race_majority_2_2016,race_majority_3_2016,race_majority_4_2016,social_conformity_1_2016,social_conformity_2_2016,social_conformity_3_2016,social_conformity_4_2016,civic_participation_2016,political_correctness_2016,race_2016,race_other_2016,race_fate_2016,race_importance_2016,labunmemb_2016,milstat_1_2016,milstat_2_2016,milstat_3_2016,milstat_4_2016,milstat_5_2016,gunown_2016,smoke100_2016,smokenow_2016,healthdk_0_2016,healthcov2_2016,healthcov_t_2016,alcohol_2016,painkillers_2016,drugs_2016,victim_12mo_2016,educ_2016,marstat_2016,child18_2016,employ_2016,employ_t_2016,faminc_2016,pid3_2016,pid3_t_2016,pid7_2016,ideo5_2016,newsint_2016,pew_bornagain_2016,pew_religimp_2016,pew_churatd_2016,pew_prayer_2016,religpew_2016,religpew_t_2016,votemeth16_rnd_2016,presvote16post_rnd_2016,vote2016_cand2_rnd_2016,clinton_rubio_rnd_2016,clinton_cruz_rnd_2016,sanders_trump_rnd_2016,sanders_rubio_rnd_2016,second_chance_rnd_2016,obamaapp_rnd_2016,fav_grid_row_rnd_2016,fav_grid_col_rnd_2016,party_agendas_d_grid_row_rnd_201,party_agendas_r_grid_row_rnd_201,rigged_system_grid_row_rnd_2016,track_rnd_2016,persfinretro_rnd_2016,econtrend_rnd_2016,americatrend_rnd_2016,futuretrend_rnd_2016,wealth_rnd_2016,values_culture_rnd_2016,us_respect_rnd_2016,trust_people_rnd_2016,helpful_people_rnd_2016,fair_people_rnd_2016,t1_grid_row_rnd_2016,imiss_row_rnd_2016,imiss_col_rnd_2016,immi_contribution_rnd_2016,immi_naturalize_rnd_2016,immi_makedifficult_rnd_2016,immi_muslim_rnd_2016,abortview3_rnd_2016,gaymar_rnd_2016,view_transgender_rnd_2016,deathpen_rnd_2016,police_threat_rnd_2016,conviction_accuracy_rnd_2016,healthreformbill_rnd_2016,envwarm_rnd_2016,envpoll2_rnd_2016,affirmact_gen_rnd_2016,taxdoug_rnd_2016,gvmt_involment_rnd_2016,tradepolicy_rnd_2016,free_trade_grid_row_rnd_2016,agree_grid_row_rnd_2016,proud_grid_row_rnd_2016,conceptions_grid_row_rnd_2016,sexism_grid_row_rnd_2016,gender_equality_rnd_2016,racialresent_grid_row_rnd_2016,race_majority_row_rnd_2016,m_sc_1_sc_4_rnd_2016,social_conformity_1_grid_col_rnd,social_conformity_2_grid_col_rnd,social_conformity_3_grid_col_rnd,social_conformity_4_grid_col_rnd,political_correctness_rnd_2016,gunown_rnd_2016,newsint2_baseline,track_baseline,trustgovt_baseline,persfinretro_baseline,econtrend_baseline,fatalism2_baseline,obamaapp_baseline,watchtv_baseline,morn_show_1_baseline,morn_show_2_baseline,morn_show_3_baseline,morn_show_4_baseline,morn_show_5_baseline,morn_show_6_baseline,morn_show_99_baseline,enews_show_1_baseline,enews_show_2_baseline,enews_show_3_baseline,enews_show_4_baseline,enews_show_5_baseline,enews_show_6_baseline,enews_show_7_baseline,enews_show_99_baseline,sundaytalkshow_1_baseline,sundaytalkshow_2_baseline,sundaytalkshow_3_baseline,sundaytalkshow_4_baseline,sundaytalkshow_5_baseline,sundaytalkshow_99_baseline,dailytalkshow_1_baseline,dailytalkshow_2_baseline,dailytalkshow_3_baseline,dailytalkshow_4_baseline,dailytalkshow_5_baseline,dailytalkshow_6_baseline,dailytalkshow_7_baseline,dailytalkshow_8_baseline,dailytalkshow_9_baseline,dailytalkshow_99_baseline,latetalk_1_baseline,latetalk_2_baseline,latetalk_3_baseline,latetalk_4_baseline,latetalk_5_baseline,latetalk_6_baseline,latetalk_7_baseline,latetalk_8_baseline,latetalk_9_baseline,latetalk_10_baseline,latetalk_99_baseline,localeve_baseline,localnewspaper_baseline,ideo5_baseline,imiss_a_baseline,imiss_b_baseline,imiss_c_baseline,imiss_d_baseline,imiss_f_baseline,imiss_g_baseline,imiss_h_baseline,imiss_j_baseline,imiss_m_baseline,imiss_p_baseline,imiss_q_baseline,imiss_r_baseline,imiss_s_baseline,imiss_t_baseline,imissf_baseline,imissf2_baseline,immi_contribution_baseline,immi_naturalize_baseline,immi_makedifficult_baseline,abortview3_baseline,gaymar2_baseline,deathpenalty_baseline,deathpenfreq_baseline,taxwealth_baseline,univhealthcov_baseline,healthtaxch3_baseline,healthqualch3_baseline,healthreformbill_baseline,envwarm_baseline,envser2_baseline,envpoll2_baseline,affirmact_gen_baseline,tradepolicy_baseline,govt_reg_baseline,pid7_baseline,pid3_t_baseline,pid3_baseline,pid7others_baseline,vote_generic_baseline,match_generic_t_baseline,cong2012_2_baseline,cong2012_2_t_baseline,marstat_baseline,partyid_sp_baseline,polinterest_baseline,pol_know_baseline,pk_ideo_baseline,pk_house_baseline,pk_senate_baseline,pk_hminl_baseline,pk_speaker_baseline,pk_hmajl_baseline,pk_sminl_baseline,pk_vp_baseline,pk_smajl_baseline,pk_scj_baseline,teapartymemb_baseline,teapartsup_baseline,selfdescr_ccap_1_baseline,selfdescr_ccap_2_baseline,selfdescr_ccap_3_baseline,selfdescr_ccap_4_baseline,selfdescr_ccap_5_baseline,selfdescr_ccap_6_baseline,selfdescr_ccap_7_baseline,selfdescr_ccap_8_baseline,selfdescr_ccap_9_baseline,selfdescr_ccap_10_baseline,selfdescr_ccap_11_baseline,selfdescr_ccap_12_baseline,selfdescr_ccap_13_baseline,selfdescr_ccap_99_baseline,abortidentity_baseline,race_deservemore_baseline,race_overcome_baseline,race_tryharder_baseline,race_slave_baseline,therm_baseline,blacks_t_baseline,whites_t_baseline,asians_t_baseline,latinos_t_baseline,christians_t_baseline,jews_t_baseline,muslims_t_baseline,mormons_t_baseline,gays_t_baseline,add_confirm_baseline,inputzip_baseline,votereg_baseline,regzip_baseline,votereg_f_baseline,regzip2_baseline,votereg_fnd_baseline,inputstate_baseline,region_baseline,urbancity_baseline,urbancity_t_baseline,ownorrent_baseline,ownhome_t_baseline,lengthres_baseline,partyreg_baseline,partyreg_t_baseline,reliablevoter_baseline,straighttic_baseline,voted08_ccap_baseline,presvote08_baseline,otpresvote08_baseline,vote10_baseline,congvote10_ccap_baseline,fav_romn_baseline,fav_ging_baseline,fav_hunt_baseline,fav_bach_baseline,fav_ronp_baseline,fav_sant_baseline,fav_perr_baseline,fav_obama_baseline,fav_hrc_baseline,fav_biden_baseline,ideoobama_baseline,saysobama_baseline,likeobama_baseline,ideonewt_baseline,saysnewt_baseline,likenewt_baseline,ideoromney_baseline,saysromney_baseline,likeromney_baseline,repchoice_baseline,repnom_baseline,repnom_t_baseline,repnom_f_baseline,repnom_f_t_baseline,cmatch_romn_baseline,cmatch_romn_t_baseline,cmatch_romn_f_baseline,cmatch_ging_baseline,cmatch_ging_t_baseline,cmatch_ging_f_baseline,cmatch_paul_baseline,cmatch_paul_t_baseline,cmatch_paul_f_baseline,org_membership_1_baseline,org_membership_2_baseline,org_membership_3_baseline,org_membership_4_baseline,org_membership_5_baseline,org_membership_6_baseline,org_membership_7_baseline,org_membership_8_baseline,org_membership_9_baseline,org_membership_10_baseline,org_membership_11_baseline,org_membership_12_baseline,org_membership_13_baseline,org_membership_14_baseline,org_membership_15_baseline,org_membership_16_baseline,org_membership_17_baseline,org_membership_18_baseline,org_membership_19_baseline,org_membership_20_baseline,org_membership_21_baseline,volunteer_baseline,volunteerf_baseline,volunteernum_baseline,volunteerorg2_1_baseline,volunteerorg2_2_baseline,volunteerorg2_3_baseline,volunteerorg2_4_baseline,volunteerorg2_5_baseline,volunteerorg2_6_baseline,volunteerorg2_7_baseline,volunteerorg2_8_baseline,volunteerorg2_9_baseline,volunteerorg2_10_baseline,volunteerorg2_11_baseline,volunteerorg2_12_baseline,volunteerorg2_13_baseline,volunteerorg2_14_baseline,volunteerorg2_15_baseline,volunteerorg2_16_baseline,volunteerorg2_17_baseline,polcontr_t_baseline,polcontr_1_baseline,polcontr_2_baseline,polcontr_3_baseline,polcontr_4_baseline,polcontr_5_baseline,polcontr_6_baseline,polcontr_7_baseline,labunmemb_baseline,pew_bornagain_baseline,pew_religimp_baseline,pew_churatd_baseline,pew_prayer_baseline,religpew_baseline,religpew_t_baseline,religpew_protestant_baseline,religpew_protestant_t_baseline,xreligpew_protestant_baseline,religpew_baptist_baseline,religpew_baptist_t_baseline,religpew_methodist_baseline,religpew_methodist_t_baseline,religpew_nondenom_baseline,religpew_nondenom_t_baseline,religpew_lutheran_baseline,religpew_lutheran_t_baseline,religpew_presby_baseline,religpew_presby_t_baseline,religpew_pentecost_baseline,religpew_pentecost_t_baseline,religpew_episcop_baseline,religpew_episcop_t_baseline,religpew_christian_baseline,religpew_christian_t_baseline,religpew_congreg_baseline,religpew_congreg_t_baseline,religpew_holiness_baseline,religpew_holiness_t_baseline,religpew_reformed_baseline,religpew_reformed_t_baseline,religpew_advent_baseline,religpew_advent_t_baseline,religpew_catholic_baseline,religpew_catholic_t_baseline,religpew_mormon_baseline,religpew_mormon_t_baseline,religpew_orthodox_baseline,religpew_orthodox_t_baseline,religpew_jewish_baseline,religpew_jewish_t_baseline,religpew_muslim_baseline,religpew_muslim_t_baseline,religpew_buddhist_baseline,religpew_buddhist_t_baseline,religpew_hindu_baseline,religpew_hindu_t_baseline,milstat_1_baseline,milstat_2_baseline,milstat_3_baseline,milstat_4_baseline,milstat_5_baseline,milstat_insert_baseline,gunown_baseline,smoke100_baseline,smokenow_baseline,healthdk_0_baseline,healthcov2_baseline,healthcov_t_baseline,knowgay4_baseline,closegay4_baseline,birthyr_baseline,gender_baseline,race_baseline,race_other_baseline,educ_baseline,child18_baseline,child18num_baseline,child_age1_1_baseline,child_age2_1_baseline,child_age3_1_baseline,child_age4_1_baseline,child_age5_1_baseline,child_age6_1_baseline,child_age7_1_baseline,child_age8_1_baseline,child_age9_1_baseline,child_age10_1_baseline,student2_baseline,job_baseline,employstat2_t_baseline,employstat2_baseline,industry_baseline,industry_former_baseline,naics3_t_baseline,naics3_baseline,occupationcat_baseline,occupationother_baseline,hourscomputing_baseline,intuse_else_baseline,intuse_home_baseline,intuse_mobile_baseline,intuse_work_baseline,intuse2_home_baseline,intuse2_work_baseline,intuse2_cafe_baseline,intuse2_mobile_baseline,intuse2_else_baseline,daily_intuse_home_baseline,daily_intuse_work_baseline,daily_intuse_cafe_baseline,daily_intuse_mobile_baseline,daily_intuse_else_baseline,employ_spouse_baseline,employ_spouse_t_baseline,phone_baseline,faminc_baseline,cand_baseline,cdid_baseline,demnom2_baseline,demnom_t_baseline,izip_baseline,lookupzip_baseline,prim12_baseline,statefips_baseline,ccap2012_post_2016,post_inputstate_2012,post_cdid113_2012,post_turnout12_2012,post_turnout_method12_2012,post_presvote12_2012,post_presvote12_other_2012,post_senvote12_2012,post_senvote12_other_2012,post_house12_2012,post_housevote12_other_2012,post_pid7_2012,post_pid3_t_2012,post_pid3_2012,post_ideo5_2012,post_newsint_2012,post_housecand1name_2012,post_housecand1party_2012,post_housecand2name_2012,post_housecand2party_2012,post_housecand3name_2012,post_housecand3party_2012,post_sencand1name_2012,post_sencand1party_2012,post_sencand2name_2012,post_sencand2party_2012,post_sencand3name_2012,post_sencand3party_2012,starttime_2016,endtime_2016
0,779,0.358213,Republican Party,In the Democratic primary,Hillary Clinton,,California,94952,Yes,Yes,,Yes,,By mail,Hillary Clinton,__NA__,,Vote in favor,Hillary Clinton (Democratic),Hillary Clinton (Democratic),Bernie Sanders (Democratic),Bernie Sanders (Democratic),,No,,__NA__,Very confident,Not too confident,Strongly Approve,Very unfavorable,Very unfavorable,Somewhat unfavorable,Somewhat unfavorable,Very favorable,Very favorable,Very favorable,Somewhat unfavorable,,,,,,,,,,,,,About the same,Somewhat more,Much less,Somewhat more,About the same,Much more,Much more,Much less,About the same,Much more,About the same,Much more,Disagree,Strongly disagree,Strongly agree,Strongly disagree,Disagree,Agree,Off on the wrong track,About the same as now,Getting better,Better,Don't know,Should be more evenly distributed,Holding steady,As respected as in the past,Some of the time,Don't know,People try to be helpful,Don't know,95,94,90,90,89,94,50 - No feeling at all,100 - Favorable feeling,89,79,21,99,78,89,2,Somewhat important,Somewhat important,Very important,Very important,Very important,Somewhat important,Very important,Very important,Somewhat important,Very important,Very important,Very important,Very important,Very important,Somewhat important,Somewhat important,Very important,Somewhat important,Very important,Very important,Somewhat important,Very important,Very important,Mostly make a contribution,Favor,Slightly easier,Strongly oppose,Legal in all cases,Favor,Should be allow to us the restrooms of the gen...,Opposed to the death penalty,Too often,Don't know,"Having 20,000 people in prison who are actuall...",Yes,Expanded,Definitely is happening,Pollution from human activities,Favor,Yes,Too little,We need a strong government to handle today's ...,Favor,No impact,No impact,Increase,No impact,Increase,Agree strongly,Agree,Disagree,Somewhat proud,Not very proud,Not very proud,Not very important,Very important,Don't know,Fairly important,Not important at all,Very important,Not important at all,Very important,Strongly Disagree,Strongly Disagree,Strongly Agree,Strongly Disagree,Strongly Disagree,Strongly Agree,Don't know,Agree,Strongly Disagree,Strongly Disagree,Agree,Treat both groups the same,Strongly Disagree,Disagree,Strongly agree,Strongly agree,Strongly disagree,Strongly disagree,Respect for elders,Curiosity,Self reliance,Considerate,Once or twice a month,"Even if some people are offended, Americans ne...",White,__NA__,Not very much,Not at all important,No one in my household belongs to a union,No,No,No,Yes,No,No one in the household owns a gun,Yes,Not at all,Yes,"I'm covered by a government plan, such as Medi...",__NA__,No,No,No,Very Unlikely,4-year,Widowed,No,Retired,__NA__,Prefer not to say,Democrat,__NA__,Not very strong Democrat,Moderate,Most of the time,No,Not too important,Seldom,Seldom,Roman Catholic,__NA__,__NA__,__NA__,__NA__,"reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])",__NA__,"reverse(1, [3,2,1,0])","randomize(27327, [5,4,7,2,6,1,3,0])","reverse(1, [3,2,1,0])",__NA__,"randomize(299084849, [2,7,5,0,11,10,1,8,4,6,9,3])","randomize(508, [2,5,0,4,3,1])","reverse(1, [1,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [1,0])","reverse(0, [0,1,2])","reverse(0, [0,2])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1])","randomize(120113210084, [9,8,11,4,0,7,6,3,13,1...","randomize(1826312573888154007586, [7,8,14,4,16...","reverse(0, [0,1,2,3])","reverse(0, [0,2])","reverse(1, [1,0])","reverse(1, [4,3,2,1,0])","reverse(1, [3,2,1,0])","reverse(0, [0,1,2])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(0, [0,1,2,3])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","randomize(44, [3,2,1,4,0])","randomize(4, [2,1,0])","randomize(0, [0,1,2])","randomize(34872, [6,7,2,5,1,3,0,4])","randomize(73, [1,4,2,3,0,5])","reverse(0, [0,2])","randomize(14, [0,3,1,2])","randomize(19, [3,0,2,1])","randomize(0, [0,1,2,3])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [2,1,0])",Most of the time,Generally headed in the right direction,Some of the time,About the same as now,Getting better,Disagree somewhat,Somewhat Approve,3 - 4 hours,No,No,No,No,No,Yes,No,No,No,Yes,No,Yes,No,No,No,Yes,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,No,No,No,No,Yes,Yes,Yes,No,No,No,No,five,none,Moderate,Unimportant,Very Important,Somewhat Important,Somewhat Important,Somewhat Important,Very Important,Very Important,Very Important,Very Important,Very Important,Very Important,Very Important,Very Important,Not very Important,Education,,Mostly make a contribution,Favor,Slightly easier,Legal in all cases,Favor,Opposed to the death penalty,Too often,Favor,Yes,About the same,About the same,Expanded,Definitely is happening,Very serious,Pollution from human activities,Favor,Favor,Too little,Not very strong Democrat,__NA__,Democrat,,The Democratic Party candidate,,The Democratic Party candidate,,Widowed,,Very much interested,A lot,Republican Party,Republican Party,Democratic Party,Representative,Representative,Representative,Senator,Vice President,Senator,Judge,No,Strongly oppose,No,No,No,No,No,Yes,No,No,No,Yes,No,No,No,No,Pro-choice,Agree,Disagree,Strongly Disagree,Agree,1.0,60.0,59.0,65.0,61.0,63.0,61.0,61.0,60.0,70.0,,89052.0,Yes,,Yes,,,Nevada,West,Suburb,,Owned by you or your family,,3-4 years,,__NA__,Always,Vote for both Democrats and Republicans,Yes,Barack Obama,,Yes,Democratic candidate,Somewhat unfavorable,Very unfavorable,Somewhat favorable,Very unfavorable,Somewhat unfavorable,Very unfavorable,Very unfavorable,Very favorable,Very favorable,Very favorable,Moderate,Says what he believes,Like a lot,Conservative,Says what he thinks people want to hear,Dislike,Conservative,Says what he thinks people want to hear,Not sure,Compromises to get things done.,No preference,__NA__,,__NA__,Barack Obama,__NA__,,Barack Obama,__NA__,,,__NA__,,No,No,Yes,No,Yes,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,,1.0,No,No,No,No,No,No,Yes,No,No,No,No,No,No,No,No,No,No,__NA__,Yes,No,No,Yes,No,No,No,No one in my household belongs to a union,No,Somewhat important,Seldom,Once a day,Roman Catholic,,,__NA__,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,Roman Catholic Church,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,No,No,No,Yes,No,__NA__,No one in the household owns a gun,Yes,Not at all,Yes,"I'm covered by a government plan, such as Medi...",,Yes,Member of my family,1931,Female,White,,4-year,No,,,,,,,,,,,,Not a student,,__NA__,Retired,,Information,__NA__,,Middle Management,,5.0,,,,,Several times a day,,Never,Never,Never,3-6 hours per day,,,,,,__NA__,Both,"$50,000 - $59,999",258342,3.0,Barack Obama,,89052.0,89052,Democratic primary or caucus,32.0,Yes,Nevada,3,I definitely voted in the General Election on ...,In person before election day (early),Barack Obama,__NA__,$SenCand1Name ($SenCand1Party),__NA__,$HouseCand1Name ($HouseCand1Party),__NA__,Not very strong Democrat,__NA__,Democrat,Moderate,Most of the time,John Oceguera,Democratic,Joe Heck,Republican,,,Shelley Berkley,Democratic,Dean Heller,Republican,,,29nov2016 22:59:43,29nov2016 23:28:24
1,2108,0.562867,Republican Party,In the Republican primary,,Donald Trump,Arizona,85298,Yes,Yes,,Yes,,In person before the election,Donald Trump,__NA__,,Vote in favor,Marco Rubio (Republican),Ted Cruz (Republican),Donald Trump (Republican),Marco Rubio (Republican),,No,,__NA__,Very confident,Very confident,Strongly Disapprove,Very favorable,Very favorable,Very favorable,Very favorable,Very unfavorable,Very unfavorable,Very unfavorable,Very favorable,,,,,,,,,,,,,Much more,Much more,Much more,Much more,Somewhat more,Much less,About the same,About the same,Much more,Somewhat less,Much more,Much more,Agree,Strongly agree,Disagree,Strongly agree,Disagree,Agree,Off on the wrong track,Worse off financially,Getting worse,Better,Better than R's,Distribution is fair,Generally becoming rarer and less accepted,Less respected,Some of the time,Most people can be trusted,People try to be helpful,People would try to be fair,97,99,100 - Favorable feeling,100 - Favorable feeling,75 - Favorable feeling,97,100 - Favorable feeling,52,97,29,75 - Favorable feeling,84,48,97,51,Very important,Very important,Somewhat important,Somewhat important,Very important,Very important,Unimportant,Somewhat important,Somewhat important,Very important,Somewhat important,Unimportant,Somewhat important,Somewhat important,Very important,Very important,Very important,Very important,Somewhat important,Very important,Somewhat important,Not very important,Unimportant,Neither,Don't know,No change,Don't know,Legal/Illegal in some cases,Oppose,Should be required to use the restrooms of the...,Favor the death penalty,Not often enough,Isolated incidents,"Having 20,000 people in prison who are actuall...",No,Repealed,Definitely is not happening,,Oppose,No,Too much,People would be better able to handle today's ...,Favor,Decrease,Decrease,Increase,No impact,Decrease,Agree strongly,Agree,Agree,Somewhat proud,Somewhat proud,Somewhat proud,Not important at all,Very important,Not important at all,Very important,Fairly important,Very important,Not important at all,Very important,Somewhat Agree,Strongly Agree,Somewhat Agree,Somewhat Agree,Somewhat Disagree,Somewhat Agree,Men have more opportunities than women,Disagree,Strongly Agree,Agree,Strongly Disagree,Treat both groups the same,Agree,Agree,Strongly agree,Strongly agree,Strongly agree,Disagree,Respect for elders,Good manners,Self reliance,Considerate,Seldom,"Even if some people are offended, Americans ne...",White,__NA__,Not very much,Very important,No one in my household belongs to a union,No,No,No,Yes,No,Personally own a gun,No,,Yes,I have private insurance or belong to an HMO.,__NA__,Yes,Yes,Yes,Very Unlikely,Some college,Married,No,Permanently disabled,__NA__,"$60,000 - $69,999",Republican,__NA__,Strong Republican,Conservative,Most of the time,No,Very important,More than once a week,Several times a day,Mormon,__NA__,__NA__,__NA__,__NA__,"reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])",__NA__,"reverse(1, [3,2,1,0])","randomize(80, [0,4,3,1,2,5,6,7])","reverse(1, [3,2,1,0])",__NA__,"randomize(409649629, [7,11,6,0,1,3,2,4,10,8,5,9])","randomize(20, [3,2,1,0,4,5])","reverse(0, [0,1])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,1])","reverse(1, [2,1,0])","reverse(0, [0,2])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","randomize(355278854180, [3,2,1,11,4,10,9,0,5,8...","randomize(1272299552368081230432, [19,8,20,16,...","reverse(1, [3,2,1,0])","reverse(0, [0,2])","reverse(1, [1,0])","reverse(0, [0,1,2,3,4])","reverse(1, [3,2,1,0])","reverse(1, [2,1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(0, [0,1,2,3])",__NA__,"reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","randomize(34, [2,1,3,4,0])","randomize(4, [2,1,0])","randomize(1, [1,0,2])","randomize(39343, [7,6,5,2,1,3,0,4])","randomize(511, [1,5,3,4,2,0])","reverse(0, [0,2])","randomize(2, [0,2,1,3])","randomize(10, [2,1,3,0])","randomize(6, [0,1,3,2])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(0, [0,1,2])",Most of the time,Off on the wrong track,Some of the time,Better off financially,About the same,Disagree strongly,Strongly Disapprove,More than 4 hours,No,No,No,No,No,No,Yes,Yes,Yes,Yes,Yes,Yes,No,Yes,No,No,No,No,No,No,Yes,Yes,Yes,Yes,No,No,Yes,No,No,Yes,No,No,No,No,No,No,No,No,No,Yes,Yes,No,four,everyday,Very Conservative,Very Important,Very Important,Very Important,Unimportant,Very Important,Somewhat Important,Not very Important,Very Important,Somewhat Important,Very Important,Very Important,Very Important,Very Important,Very Important,The economy,,Mostly a drain,Not sure,No change,Legal in some cases and illegal in others,Oppose,Favor the death penalty,Not often enough,Oppose,No,Pay more,Worse care,Repealed,Definitely is not happening,,,Oppose,Favor,Too much,Strong Republican,__NA__,Republican,,The Republican Party candidate,,The Republican Party candidate,,Married,Republican,Very much interested,A lot,Republican Party,Republican Party,Democratic Party,Senator,Senator,Representative,Senator,Vice President,Senator,Judge,Yes,Strongly support,No,No,No,No,No,Yes,Yes,No,No,Yes,Yes,No,No,No,Pro-life,Strongly Disagree,Strongly Agree,Agree,Strongly Disagree,1.0,100.0,89.0,98.0,100.0,100.0,97.0,66.0,99.0,92.0,Yes,,Yes,,Yes,,,Arizona,West,Rural area,,Rented from someone else,,5-10 years,Republican,,Always,Vote for both Democrats and Republicans,Yes,John McCain,__NA__,,Republican candidate,Very favorable,Somewhat favorable,Somewhat favorable,Very favorable,Somewhat unfavorable,Very favorable,Somewhat favorable,Very unfavorable,Somewhat unfavorable,Somewhat unfavorable,Very liberal,Says what he thinks people want to hear,Like somewhat,Moderate,Says what he believes,Like somewhat,Conservative,Says what he believes,Like a lot,"Sticks to their principles, no matter what.",Mitt Romney,__NA__,Rick Santorum,__NA__,Mitt Romney,__NA__,,Newt Gingrich,__NA__,,,__NA__,,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,Yes,,1.0,Yes,Yes,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,__NA__,No,No,No,No,No,No,Yes,No one in my household belongs to a union,No,Very important,More than once a week,Several times a day,Mormon,,,__NA__,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,The Church of Jesus Christ of Latter-day Saints,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,No,No,No,Yes,No,__NA__,Personally own a gun,No,,Yes,I have private insurance or belong to an HMO.,,Yes,Member of my family,1952,Female,White,,Some college,No,,,,,,,,,,,,Not a student,,__NA__,Permanently disabled,,,__NA__,,Retired,,2.0,Several times a day,Never,3-5 days a week,,,,,,,1-2 hours per day,,,,,Full-time,,Both,"$70,000 - $79,999",317635,6.0,Not sure,,85298.0,85298,Republican primary or caucus,4.0,Yes,Arizona,5,I definitely voted in the General Election on ...,In person before election day (early),Mitt Romney,__NA__,$SenCand2Name ($SenCand2Party),__NA__,$HouseCand2Name ($HouseCand2Party),__NA__,Strong Republican,__NA__,Republican,Conservative,Most of the time,Spencer Morgan,Democratic,Matt Salmon,Republican,,,Richard Carmona,Democratic,Jeff Flake,Republican,,,29nov2016 15:41:28,29nov2016 18:58:28
2,2597,0.552138,Republican Party,In the Democratic primary,Hillary Clinton,,Wisconsin,54904,Yes,Yes,,Yes,,In person before the election,Hillary Clinton,__NA__,,Vote in favor,Hillary Clinton (Democratic),Hillary Clinton (Democratic),Bernie Sanders (Democratic),Bernie Sanders (Democratic),,No,,__NA__,Not too confident,Not too confident,Strongly Approve,Very unfavorable,Very unfavorable,Very unfavorable,Very unfavorable,Very favorable,Very favorable,Somewhat favorable,Very unfavorable,,,,,,,,,,,,,About the same,Somewhat more,Somewhat less,Much less,Much more,Much more,Much more,Somewhat less,Somewhat more,About the same,About the same,Somewhat more,Agree,Strongly disagree,Strongly agree,Strongly disagree,Strongly agree,Strongly agree,Generally headed in the right direction,Worse off financially,Getting worse,Better,Better than R's,Should be more evenly distributed,Generally becoming rarer and less accepted,More respected,Some of the time,Can't be too careful in dealing with people,People are looking out for themselves,People would try to take advantage,77,83,77,90,51,75 - Favorable feeling,50 - No feeling at all,69,75 - Favorable feeling,89,25 -Unfavorable feeling,50 - No feeling at all,99,94,0 - Unfavorable feeling,Very important,Very important,Somewhat important,Very important,Not very important,Very important,Not very important,Somewhat important,Unimportant,Very important,Very important,Very important,Very important,Very important,Very important,Somewhat important,Very important,Very important,Very important,Not very important,Somewhat important,Very important,Somewhat important,Mostly make a contribution,Favor,Slightly harder,Somewhat oppose,Legal in all cases,Favor,Should be allow to us the restrooms of the gen...,Favor the death penalty,Not often enough,Isolated incidents,"Having 20,000 people in prison who are actuall...",Yes,Expanded,Definitely is happening,Pollution from human activities,Favor,Yes,Too little,We need a strong government to handle today's ...,Favor,Decrease,No impact,Decrease,Increase,No impact,Agree strongly,Agree,Agree strongly,Very proud,Very proud,Somewhat proud,Not very important,Very important,Very important,Very important,Not important at all,Very important,Not very important,Very important,Strongly Disagree,Somewhat Disagree,Strongly Agree,Somewhat Disagree,Strongly Disagree,Strongly Agree,Men have more opportunities than women,Disagree,Agree,Strongly Agree,Strongly Disagree,Treat both groups the same,Disagree,Agree,Agree,Agree,Disagree,Disagree,,Good manners,,Well behaved,Never,People need to be more careful about the langu...,White,__NA__,Some,Very important,No one in my household belongs to a union,No,No,Yes,No,No,Personally own a gun,No,,Yes,"I'm covered by a government plan, such as Medi...",__NA__,No,No,No,Somewhat Likely,High school graduate,Single,No,Retired,__NA__,"$50,000 - $59,999",Independent,__NA__,Lean Democrat,Moderate,Most of the time,No,Not at all important,Seldom,A few times a week,Roman Catholic,__NA__,__NA__,__NA__,__NA__,"reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])",__NA__,"reverse(0, [0,1,2,3])","randomize(29951, [6,0,7,2,1,4,3,5])","reverse(0, [0,1,2,3])",__NA__,"randomize(201571018, [2,5,4,0,9,7,11,6,3,8,10,1])","randomize(471, [4,3,5,2,1,0])","reverse(1, [1,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(1, [2,0])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(1, [1,0])","randomize(1117654743898, [2,8,14,9,10,0,12,6,1...","randomize(7611805231108026090267, [20,5,18,4,1...","reverse(1, [3,2,1,0])","reverse(0, [0,2])","reverse(0, [0,1])","reverse(1, [4,3,2,1,0])","reverse(0, [0,1,2,3])","reverse(0, [0,1,2])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(1, [2,1,0])","reverse(1, [3,2,1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","randomize(99, [4,2,0,3,1])","randomize(1, [1,0,2])","randomize(0, [0,1,2])","randomize(31691, [2,7,3,1,6,5,4,0])","randomize(518, [0,5,1,4,2,3])","reverse(0, [0,2])","randomize(8, [0,2,3,1])","randomize(9, [1,2,3,0])","randomize(9, [1,2,3,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [2,1,0])",Most of the time,Generally headed in the right direction,Most of the time,Worse off financially,Getting better,Agree strongly,Somewhat Approve,3 - 4 hours,No,No,No,No,No,Yes,No,Yes,No,No,No,No,No,No,No,No,No,No,No,Yes,No,No,No,No,Yes,Yes,No,No,No,No,No,No,No,No,No,No,Yes,Yes,No,No,No,No,everyday,everyday,Moderate,Unimportant,Very Important,Unimportant,Not very Important,Somewhat Important,Unimportant,Somewhat Important,Very Important,Very Important,Somewhat Important,Not very Important,Very Important,Very Important,Unimportant,The economy,,Mostly make a contribution,Favor,Much easier,Legal in all cases,Favor,Favor the death penalty,Not often enough,Favor,Yes,Pay less,Better care,Expanded,Definitely is happening,Very serious,Pollution from human activities,Favor,Favor,Too little,Lean Democrat,__NA__,Independent,,The Democratic Party candidate,,The Democratic Party candidate,,Single,,Very much interested,A lot,Republican Party,Republican Party,Democratic Party,Representative,Senator,Representative,Senator,Vice President,Senator,Judge,No,Strongly oppose,No,No,No,No,No,Yes,No,No,No,No,No,No,No,No,Neither,Agree,Disagree,Disagree,Agree,1.0,91.0,100.0,96.0,100.0,65.0,41.0,6.0,21.0,99.0,Yes,,Yes,,Yes,,,Wisconsin,Midwest,City,,Owned by you or your family,,More than 10 years,,__NA__,Always,Vote for both Democrats and Republicans,Yes,Barack Obama,,Yes,Democratic candidate,Very unfavorable,Somewhat unfavorable,Somewhat favorable,Very unfavorable,Very unfavorable,Somewhat favorable,Somewhat favorable,Somewhat favorable,Very favorable,Somewhat favorable,Liberal,Says what he believes,Like a lot,Very conservative,Says what he believes,Dislike,Moderate,Says what he thinks people want to hear,Dislike,Compromises to get things done.,Jon Huntsman,__NA__,,__NA__,Barack Obama,__NA__,,Barack Obama,__NA__,,Barack Obama,__NA__,,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,No,No,,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,__NA__,No,No,No,No,No,No,Yes,No one in my household belongs to a union,No,Not at all important,Seldom,Never,Agnostic,,,__NA__,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,Roman Catholic Church,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,No,No,Yes,No,No,__NA__,Personally own a gun,No,,Yes,"I'm covered by a government plan, such as Medi...",,No,,1931,Male,White,,High school graduate,No,,,,,,,,,,,,Not a student,,__NA__,Retired,,Government,__NA__,,Professional/Technical,,3.0,,,,,Several times a day,,Never,Never,Never,3-6 hours per day,,,,,,__NA__,Both,"$40,000 - $49,999",102825,6.0,Someone else,Hillery Clinton,54904.0,54904,Democratic primary or caucus,55.0,Yes,Wisconsin,6,I definitely voted in the General Election on ...,In person before election day (early),Mitt Romney,__NA__,$SenCand2Name ($SenCand2Party),__NA__,$HouseCand2Name ($HouseCand2Party),__NA__,Strong Republican,__NA__,Republican,Moderate,Most of the time,Joe Kallas,Democratic,Tom Petri,Republican,,,Tammy Baldwin,Democratic,Tommy Thompson,Republican,,,29nov2016 16:08:39,29nov2016 16:32:43
3,4148,0.207591,Democratic Party,In the Democratic primary,Someone else,,Oklahoma,74104,Yes,Yes,,Yes,,In person on election day,Gary Johnson,__NA__,,,Marco Rubio (Republican),Don't know,Bernie Sanders (Democratic),Bernie Sanders (Democratic),,No,,__NA__,Somewhat confident,Somewhat confident,Strongly Approve,Very unfavorable,Very unfavorable,Very unfavorable,Somewhat unfavorable,Very favorable,Very unfavorable,Somewhat unfavorable,Somewhat unfavorable,Somewhat less,About the same,Somewhat less,About the same,Somewhat more,About the same,Somewhat more,About the same,About the same,About the same,About the same,About the same,,,,,,,,,,,,,Strongly agree,Strongly disagree,Strongly agree,Strongly disagree,Agree,Strongly agree,Generally headed in the right direction,Better off financially,Getting better,Worse,Worse than R's,Should be more evenly distributed,Generally becoming rarer and less accepted,More respected,Some of the time,Can't be too careful in dealing with people,People try to be helpful,People would try to take advantage,99,51,100 - Favorable feeling,99,50 - No feeling at all,99,40,50 - No feeling at all,89,40,30,80,99,99,11,Very important,Somewhat important,Not very important,Very important,Very important,Somewhat important,Not very important,Somewhat important,Unimportant,Very important,Very important,Somewhat important,Somewhat important,Very important,Very important,Not very important,Somewhat important,Somewhat important,Somewhat important,Not very important,Somewhat important,Somewhat important,Not very important,Mostly make a contribution,Favor,Much easier,Strongly oppose,Legal/Illegal in some cases,Favor,Should be allow to us the restrooms of the gen...,Opposed to the death penalty,Too often,Part of a broader pattern,Don't know,Yes,Expanded,Probably is happening,Pollution from human activities,Oppose,Yes,Too little,We need a strong government to handle today's ...,Favor,,Decrease,Decrease,Decrease,Increase,Agree strongly,Agree,Disagree,Very proud,Very proud,Somewhat proud,Not important at all,Fairly important,Not important at all,Very important,Not important at all,Not very important,Not important at all,Very important,Strongly Disagree,Somewhat Agree,Somewhat Disagree,Somewhat Disagree,Somewhat Disagree,Somewhat Disagree,Women have more opportunities than men,Agree,Disagree,Strongly Disagree,Agree,Favor whites over blacks,Disagree,Strongly Agree,Agree,Disagree,Disagree,Strongly agree,Respect for elders,Good manners,Obedience,Well behaved,Seldom,"Even if some people are offended, Americans ne...",White,__NA__,Some,Not at all important,No one in my household belongs to a union,No,No,Yes,Yes,No,No one in the household owns a gun,No,,Yes,I have private insurance or belong to an HMO.,__NA__,No,No,No,Somewhat Unlikely,Some college,Divorced,No,Full-time,__NA__,"$70,000 - $79,999",Independent,__NA__,Lean Democrat,Moderate,Most of the time,No,Not too important,Seldom,A few times a week,Nothing in particular,__NA__,__NA__,__NA__,__NA__,"reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])",__NA__,"reverse(1, [3,2,1,0])","randomize(19121, [2,6,5,4,7,1,3,0])","reverse(1, [3,2,1,0])","randomize(171666623, [5,6,1,7,4,3,9,11,8,0,2,10])",__NA__,"randomize(85, [1,4,2,0,3,5])","reverse(1, [1,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [2,0])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(1, [2,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(0, [0,1])","randomize(402659440223, [3,0,5,2,12,13,6,1,9,4...","randomize(20783110061102022352439, [17,0,1,5,2...","reverse(0, [0,1,2,3])","reverse(1, [2,0])","reverse(1, [1,0])","reverse(0, [0,1,2,3,4])","reverse(1, [3,2,1,0])","reverse(1, [2,1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(1, [3,2,1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","randomize(92, [3,4,1,0,2])","randomize(0, [0,1,2])","randomize(3, [1,2,0])","randomize(20669, [2,5,1,7,3,0,6,4])","randomize(107, [4,0,3,1,2,5])","reverse(1, [2,0])","randomize(5, [2,0,1,3])","randomize(15, [1,3,0,2])","randomize(6, [0,1,3,2])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(0, [0,1,2])",Most of the time,Generally headed in the right direction,Most of the time,About the same as now,Getting better,Agree somewhat,Strongly Approve,More than 4 hours,No,No,No,No,No,Yes,No,No,No,No,No,Yes,Yes,Yes,No,Yes,Yes,Yes,Yes,Yes,No,No,No,No,Yes,Yes,Yes,Yes,Yes,Yes,No,No,No,No,No,No,No,No,No,No,No,No,,none,Moderate,Not very Important,Very Important,Very Important,Somewhat Important,Somewhat Important,Somewhat Important,Not very Important,Very Important,Somewhat Important,Very Important,Somewhat Important,Very Important,Somewhat Important,Unimportant,The economy,,Mostly make a contribution,Favor,Much easier,Legal in some cases and illegal in others,Favor,Favor the death penalty,About right,Favor,Yes,Pay less,About the same,Expanded,Definitely is happening,Somewhat serious,Pollution from human activities,Favor,Favor,About the right amount,Independent,__NA__,Independent,,The Democratic Party candidate,,Other,,Divorced,,Very much interested,A lot,Not sure,Republican Party,Democratic Party,Representative,Representative,Representative,Senator,Vice President,Senator,Judge,No,Strongly oppose,Yes,No,No,No,No,Yes,No,No,Yes,Yes,No,No,No,No,Both pro-life and pro-choice,Agree,Agree,Strongly Disagree,Agree,1.0,100.0,100.0,100.0,100.0,40.0,100.0,100.0,100.0,96.0,Yes,,Yes,,Yes,,,Oklahoma,South,City,,Owned by you or your family,,More than 10 years,Declined to State/Independent/No Party,,Always,Vote for both Democrats and Republicans,Yes,Barack Obama,,Yes,Democratic candidate,Somewhat unfavorable,Very unfavorable,Very favorable,Very unfavorable,Somewhat favorable,Very unfavorable,Very unfavorable,Very favorable,Somewhat unfavorable,Very favorable,Moderate,Says what he believes,Like a lot,Conservative,Says what he believes,Dislike,Moderate,Says what he thinks people want to hear,Dislike,Compromises to get things done.,Jon Huntsman,__NA__,,__NA__,Barack Obama,__NA__,,Barack Obama,__NA__,,,__NA__,,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,Yes,,3.0,No,No,No,No,Yes,No,No,No,No,No,No,No,No,No,No,No,Yes,__NA__,Yes,No,No,No,No,No,No,No one in my household belongs to a union,No,Not at all important,Seldom,A few times a month,Nothing in particular,,,__NA__,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,No,No,Yes,No,No,__NA__,No one in the household owns a gun,No,,Yes,I have private insurance or belong to an HMO.,,Yes,Member of my family,1959,Male,White,,Some college,No,,,,,,,,,,,,Not a student,,__NA__,Full-time employed,Information,,__NA__,"Data Processing, Hosting and Related Services",Professional/Technical,,12.0,Several times a day,Never,Several times a day,Never,,,,,,3-6 hours per day,More than 6 hours per day,,,,,__NA__,Both,"$80,000 - $99,999",45897,1.0,Barack Obama,,74104.0,74104,Don't plan to vote in a primary or caucus at all,40.0,Yes,Oklahoma,1,I definitely voted in the General Election on ...,In person on election day at a precinct pollin...,Barack Obama,__NA__,,__NA__,Other,,Independent,__NA__,Independent,Moderate,Most of the time,John Olson,Democratic,Jim Bridenstine,Republican,,,,,,,,,14dec2016 18:46:33,14dec2016 19:11:20
4,4460,0.333729,Republican Party,In the Republican primary,,Marco Rubio,Texas,78253,Yes,Yes,,Yes,,In person before the election,Donald Trump,__NA__,,Vote against opponent,Marco Rubio (Republican),Ted Cruz (Republican),Donald Trump (Republican),Marco Rubio (Republican),,No,,__NA__,Very confident,Very confident,Strongly Disapprove,Somewhat favorable,Somewhat unfavorable,Somewhat favorable,Very favorable,Somewhat unfavorable,Very unfavorable,Somewhat unfavorable,Very favorable,,,,,,,,,,,,,Somewhat more,Somewhat more,About the same,Much more,Much more,Much less,Much more,Somewhat more,Much more,Much more,Much more,Somewhat more,Disagree,Strongly agree,Disagree,Strongly agree,Disagree,Agree,Off on the wrong track,About the same as now,About the same,Worse,Don't know,Distribution is fair,Generally becoming rarer and less accepted,As respected as in the past,Some of the time,Can't be too careful in dealing with people,People try to be helpful,People would try to take advantage,91,75 - Favorable feeling,90,93,65,95,91,36,90,2,30,70,30,96,1,Very important,Very important,Very important,Very important,Very important,Very important,Not very important,Very important,Somewhat important,Very important,Somewhat important,Unimportant,Very important,Very important,Very important,Very important,Somewhat important,Very important,Somewhat important,Very important,Very important,Very important,Very important,Mostly a drain,Oppose,Much harder,Don't know,Legal/Illegal in some cases,Don't know,Should be required to use the restrooms of the...,Favor the death penalty,Not often enough,Isolated incidents,"Having 20,000 people not in prison but who are...",No,Repealed,Probably is happening,Natural causes not related to human activities,Oppose,No,Too much,People would be better able to handle today's ...,Favor,No impact,No impact,No impact,No impact,No impact,Agree strongly,Agree,Agree,Very proud,Somewhat proud,Very proud,Fairly important,Very important,Not very important,Very important,Fairly important,Very important,Not very important,Very important,Strongly Disagree,Somewhat Agree,Somewhat Disagree,Somewhat Disagree,Somewhat Disagree,Somewhat Agree,Women have more opportunities than men,Don't Know,Agree,Don't Know,Strongly Disagree,Don't know,Agree,Strongly Agree,Agree,Strongly agree,Agree,Disagree,Respect for elders,Curiosity,Obedience,Considerate,A few times a year,"Even if some people are offended, Americans ne...",White,__NA__,Some,Moderately important,No one in my household belongs to a union,No,No,Yes,No,No,No one in the household owns a gun,Yes,Not at all,Yes,Other,Military Tricare,Yes,No,No,Somewhat Unlikely,4-year,Married,No,Full-time,__NA__,"$40,000 - $49,999",Republican,__NA__,Strong Republican,Conservative,Most of the time,No,Very important,More than once a week,Once a day,Mormon,__NA__,__NA__,__NA__,__NA__,"reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])",__NA__,"reverse(1, [3,2,1,0])","randomize(20234, [0,4,1,7,2,5,6,3])","reverse(1, [3,2,1,0])",__NA__,"randomize(420307324, [2,11,0,3,6,10,8,4,5,1,7,9])","randomize(705, [5,2,3,0,1,4])","reverse(0, [0,1])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,2])","reverse(0, [0,1])","reverse(1, [2,1,0])","reverse(0, [0,2])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","randomize(493430789459, [8,7,4,1,13,10,3,9,5,1...","randomize(18467535318159265293698, [6,10,18,12...","reverse(1, [3,2,1,0])","reverse(0, [0,2])","reverse(1, [1,0])","reverse(1, [4,3,2,1,0])","reverse(1, [3,2,1,0])","reverse(1, [2,1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(1, [2,1,0])","reverse(0, [0,1,2,3])","reverse(1, [1,0])","reverse(1, [1,0])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(1, [1,0])","randomize(42, [3,1,2,4,0])","randomize(2, [0,2,1])","randomize(2, [0,2,1])","randomize(35589, [7,2,4,5,0,1,6,3])","randomize(560, [0,5,3,1,2,4])","reverse(0, [0,2])","randomize(11, [2,0,3,1])","randomize(10, [2,1,3,0])","randomize(20, [3,2,1,0])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(0, [0,1])","reverse(1, [1,0])","reverse(0, [0,1,2])",Most of the time,Off on the wrong track,Some of the time,Worse off financially,Getting worse,Disagree somewhat,Strongly Disapprove,1 - 2 hours,Yes,No,No,No,Yes,No,No,Yes,No,No,Yes,No,No,No,No,No,No,No,No,No,Yes,Yes,Yes,Yes,No,Yes,No,No,No,No,No,No,Yes,No,Yes,No,No,Yes,No,No,No,No,everyday,three,Conservative,Very Important,Very Important,Very Important,Somewhat Important,Very Important,Not very Important,Very Important,Very Important,Somewhat Important,Very Important,Very Important,Somewhat Important,Somewhat Important,Somewhat Important,The economy,,Mostly a drain,Not sure,Slightly easier,Illegal in all cases,Oppose,Favor the death penalty,Not often enough,Oppose,No,Pay more,Worse care,Repealed,Definitely is not happening,,,Oppose,Favor,Too much,Strong Republican,__NA__,Republican,,The Republican Party candidate,,The Republican Party candidate,,Married,Republican,Very much interested,A lot,Republican Party,Republican Party,Democratic Party,Representative,Representative,Representative,Senator,Vice President,Senator,Judge,Not Sure,Somewhat support,No,No,No,No,No,No,Yes,No,No,Yes,Yes,No,No,No,Pro-life,Agree,Disagree,Agree,Disagree,1.0,62.0,88.0,62.0,79.0,100.0,67.0,62.0,97.0,59.0,Yes,,Yes,,Yes,,,Texas,South,Suburb,,Owned by you or your family,,5-10 years,,__NA__,Always,Vote for both Democrats and Republicans,Yes,,,Yes,Republican candidate,Very favorable,Somewhat unfavorable,Somewhat favorable,Somewhat favorable,Very unfavorable,Somewhat favorable,Very unfavorable,Very unfavorable,Somewhat unfavorable,Somewhat unfavorable,Very liberal,Says what he thinks people want to hear,Like somewhat,Moderate,Says what he thinks people want to hear,Dislike,Conservative,Says what he believes,Like a lot,Compromises to get things done.,Mitt Romney,__NA__,Rick Santorum,__NA__,Mitt Romney,__NA__,,Newt Gingrich,__NA__,,,__NA__,,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,Yes,No,Yes,1.0,Yes,Yes,No,No,No,No,No,No,No,No,No,No,No,No,No,No,No,__NA__,No,Yes,No,No,No,No,No,No one in my household belongs to a union,No,Very important,Once a week,A few times a week,Mormon,,,__NA__,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,The Church of Jesus Christ of Latter-day Saints,,,__NA__,,__NA__,,__NA__,,__NA__,,__NA__,No,No,Yes,No,No,__NA__,No one in the household owns a gun,Yes,Not at all,Yes,Other,TriCare,Yes,Member of my family,1952,Male,White,,4-year,No,,,,,,,,,,,,Not a student,,__NA__,Part-time employed,"Arts, Entertainment, and Recreation",,__NA__,"Performing Arts, Spectator Sports, and Related...",Professional/Technical,,3.0,Several times a day,Never,Several times a day,Several times a day,,,,,,More than 6 hours per day,,,,,Unemployed,,Both,"$100,000 - $119,999",330742,21.0,Not sure,,78148.0,78148,Republican primary or caucus,48.0,Yes,Texas,28,I definitely voted in the General Election on ...,In person before election day (early),Mitt Romney,__NA__,$SenCand2Name ($SenCand2Party),__NA__,$HouseCand2Name ($HouseCand2Party),__NA__,Strong Republican,__NA__,Republican,Conservative,Most of the time,Henry Cuellar,Democratic,William Hayward,Republican,,,Paul Sadler,Democratic,Ted Cruz,Republican,,,01dec2016 10:17:47,01dec2016 10:59:48


In [17]:
cols = [col for col in surveys.columns if 'fav' in col and '_2016' in col] 
fav = surveys[cols].copy().drop(columns={'policies_favor_2016', 'fav_grid_row_rnd_2016', 'fav_grid_col_rnd_2016'})
fav.fillna('.', inplace=True)

## agg count the freq of values
fav = fav.apply(pd.value_counts)

fav.columns = ['Trump', 'Cruz', 'Ryan', 'Romney',
               'Obama', 'Clinton', 'Sanders', 'Rubio']

## swap the col and index of df
fav = fav.T

## convert to string with '%'
total = surveys.shape[0]
fav = fav.apply(lambda x: (np.round(x / total, 2)*100).astype(int).astype(str) + '%')

## reorder cols
fav = fav[['Very favorable', 'Somewhat favorable', 'Somewhat unfavorable', 'Very unfavorable', '.']]
fav

Unnamed: 0,Very favorable,Somewhat favorable,Somewhat unfavorable,Very unfavorable,.
Trump,26%,18%,8%,45%,1%
Cruz,11%,24%,18%,40%,1%
Ryan,9%,27%,24%,32%,1%
Romney,6%,28%,35%,24%,1%
Obama,34%,15%,9%,41%,1%
Clinton,22%,20%,9%,48%,1%
Sanders,27%,26%,16%,26%,1%
Rubio,12%,30%,24%,25%,1%


In [None]:
## across all Q's
## age, gender, race, education, party ID, idealogy, 2016 vote choice, Dem vote choice, GOP vote choice
reg_col = 'votereg2_2016'
age_col = 'age'
gender_col = 'gender_baseline'
race_col = 'race_baseline'
edu_col = 'educ_baseline'
party_col = 'partyreg_baseline'
id_col = 'ideo5_2016'
vote_col = 'presvote16post_2016'
dem_col = 'pp_demprim16_2016'
gop_col = 'pp_repprim16_2016'

## create 'age' col 
tables = surveys.copy()

tables['age'] = (2016 - tables['birthyr_baseline'])

## CROSSTABS
    ## quantiles (buckets) for the ages
    ## NEED THIS FOR EITHER APPROACH
bins = [18, 30, 45, 64, np.inf]
labels = ['18-29', '30-44', '45-64', '65+']
tables['age_quant'] = pd.cut(tables['age'], bins=bins, labels=labels)

## LONG WAY
## group answers with age_quants
output = pd.DataFrame(tables.groupby('age_quant')[reg_col].value_counts()).unstack(level=[0])
## reset col names
output.columns = labels
## change col name
output.index.name = 'Voter Registration Status'
## sort index
output.sort_index(ascending=False, inplace=True)

## SHORT WAY
pd.crosstab(index=tables[reg_col], columns=tables['age_quant'])
    ## WITH %
pd.crosstab(index=tables[reg_col], columns=tables['age_quant']).apply(lambda x: (x/x.sum())*100, axis=1)

In [33]:
    ## BUCKETS/QUANTS FOR CATEGORICAL DATA
tables.groupby(gender_col)[reg_col].value_counts().unstack(level=[0])
    ## or-
pd.crosstab(index=tables[gender_col], columns=tables[reg_col]).T

gender_baseline,Female,Male
votereg2_2016,Unnamed: 1_level_1,Unnamed: 2_level_1
Don't know,13,8
No,45,25
Yes,4002,3907


# Matches btwn cols

## map to new col based on value in other cols in 1 df

In [None]:
## ref = use output from cleaning

output['age'] = output['age'].astype(int)

date_year = output['startdate'].str[-4].astype(int)
cond1 = (abs((date_year - output['d101']) - output['age']) == 1) | (abs((date_year - output['d101']) - output['age']) == 0)
cond2 = (output['sex'].map(lambda x: 2 if 'F' in x else 1) == output['d100'])

## new binary column of matches or mismatches
output['voter_file_match'] = (cond2 | (np.where(~cond1, False, True)))
output

# EDA Kickstarters

In [34]:
report = sv.analyze(q1)
report.show_html()

                                             |                                                                …

Report SWEETVIZ_REPORT.html was generated! NOTEBOOK/COLAB USERS: the web browser MAY not pop up, regardless, the report IS saved in your notebook/colab files.


# Cleaning

## split, strip values in col into new cols for each value

In [None]:
## clean cols
q1.columns = q1.columns.str.lower()

## mask col
col = q1['vf_data']
## split the data in the col
split = col.apply(lambda x: x.split(';'))

## create dictionary of split values in previous col
dct = [dict(x.split('=', 1) for x in y) for y in split]

## merge dct into data
output = q1.join(pd.DataFrame(dct)).drop(columns='vf_data')
output.columns = output.columns.str.lower()

## order cols alphabetically

In [None]:
col_order = ['origin']
new_order = col_order + (output.columns.drop(col_order).tolist())
output = output[new_order]

## BELOW
output = output.reindex(sorted(output.columns), axis=1)

#