# Voter participation in 1844 election

Solution for the voter participation exercise.

In [None]:
# Load the 1844 election data straight from the web rather than from a
# local data directory, so that the notebook also runs in the online version.
election_url <- 'https://resampling-stats.github.io/data/election_1844.csv'
voter_df <- read.csv(election_url)
# Pull the two columns used by the later cells out as plain vectors.
spread <- voter_df$Spread
participation <- voter_df$Participation

In [None]:
# Observed correlation between participation and spread
# (the original note records the value as -0.425).
actual_r <- cor(x = participation, y = spread)
# Show the value as the cell output.
actual_r

In [None]:
# Permutation test: shuffle participation many times and see how often the
# shuffled correlation with spread is at or below the observed one.
n_trials <- 10000
# Pre-allocate one slot per trial so the vector is not grown in the loop.
results <- numeric(n_trials)

# seq_len() rather than 1:n_trials, so that a trial count of zero runs no
# iterations instead of looping over c(1, 0).
for (i in seq_len(n_trials)) {
    # Shuffle the participation rates, breaking any pairing with spread.
    shuffled <- sample(participation)
    # Compute re-sampled correlation.
    fake_r <- cor(shuffled, spread)
    # Keep the value in the results.
    results[i] <- fake_r
}

# Show the distribution of correlations obtained from the shuffled data.
hist(results, breaks=25,
     main='Distribution of shuffled correlations',
     xlab='Correlation with shuffled participation')

# Count the trials when result <= observed (a lower-tail comparison).
k <- sum(results <= actual_r)
# Compute the proportion of such trials.
kk <- k / n_trials

# Report the proportion, rounded to two decimal places.
message('Proportion of shuffled r <= observed: ', round(kk, 2))