# Wine Quality

## Introduction:

*Loading Libraries*

In [3]:
library(tidyverse)
library(tidymodels)
library(gridExtra)

── [1mAttaching packages[22m ─────────────────────────────────────── tidyverse 1.3.0 ──

[32m✔[39m [34mggplot2[39m 3.3.2     [32m✔[39m [34mpurrr  [39m 0.3.4
[32m✔[39m [34mtibble [39m 3.0.3     [32m✔[39m [34mdplyr  [39m 1.0.2
[32m✔[39m [34mtidyr  [39m 1.1.2     [32m✔[39m [34mstringr[39m 1.4.0
[32m✔[39m [34mreadr  [39m 1.3.1     [32m✔[39m [34mforcats[39m 0.5.0

“package ‘ggplot2’ was built under R version 4.0.1”
“package ‘tibble’ was built under R version 4.0.2”
“package ‘tidyr’ was built under R version 4.0.2”
“package ‘dplyr’ was built under R version 4.0.2”
── [1mConflicts[22m ────────────────────────────────────────── tidyverse_conflicts() ──
[31m✖[39m [34mdplyr[39m::[32mfilter()[39m masks [34mstats[39m::filter()
[31m✖[39m [34mdplyr[39m::[32mlag()[39m    masks [34mstats[39m::lag()

“package ‘tidymodels’ was built under R version 4.0.2”
── [1mAttaching packages[22m ────────────────────────────────────── tidymodels 0.1.1 ──

[32m✔

*Reading in data*

In [5]:
data <- read_csv("data/WineQT.csv")
data

Parsed with column specification:
cols(
  `fixed acidity` = [32mcol_double()[39m,
  `volatile acidity` = [32mcol_double()[39m,
  `citric acid` = [32mcol_double()[39m,
  `residual sugar` = [32mcol_double()[39m,
  chlorides = [32mcol_double()[39m,
  `free sulfur dioxide` = [32mcol_double()[39m,
  `total sulfur dioxide` = [32mcol_double()[39m,
  density = [32mcol_double()[39m,
  pH = [32mcol_double()[39m,
  sulphates = [32mcol_double()[39m,
  alcohol = [32mcol_double()[39m,
  quality = [32mcol_double()[39m,
  Id = [32mcol_double()[39m
)



fixed acidity,volatile acidity,citric acid,residual sugar,chlorides,free sulfur dioxide,total sulfur dioxide,density,pH,sulphates,alcohol,quality,Id
<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>
7.4,0.700,0.00,1.9,0.076,11,34,0.9978,3.51,0.56,9.4,5,0
7.8,0.880,0.00,2.6,0.098,25,67,0.9968,3.20,0.68,9.8,5,1
7.8,0.760,0.04,2.3,0.092,15,54,0.9970,3.26,0.65,9.8,5,2
11.2,0.280,0.56,1.9,0.075,17,60,0.9980,3.16,0.58,9.8,6,3
7.4,0.700,0.00,1.9,0.076,11,34,0.9978,3.51,0.56,9.4,5,4
7.4,0.660,0.00,1.8,0.075,13,40,0.9978,3.51,0.56,9.4,5,5
7.9,0.600,0.06,1.6,0.069,15,59,0.9964,3.30,0.46,9.4,5,6
7.3,0.650,0.00,1.2,0.065,15,21,0.9946,3.39,0.47,10.0,7,7
7.8,0.580,0.02,2.0,0.073,9,18,0.9968,3.36,0.57,9.5,7,8
6.7,0.580,0.08,1.8,0.097,15,65,0.9959,3.28,0.54,9.2,5,10


*Cleaning and Wrangling*

[insert units here]

In [7]:
data <- mutate(data, quality = as_factor(quality))
data

fixed acidity,volatile acidity,citric acid,residual sugar,chlorides,free sulfur dioxide,total sulfur dioxide,density,pH,sulphates,alcohol,quality,Id
<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<fct>,<dbl>
7.4,0.700,0.00,1.9,0.076,11,34,0.9978,3.51,0.56,9.4,5,0
7.8,0.880,0.00,2.6,0.098,25,67,0.9968,3.20,0.68,9.8,5,1
7.8,0.760,0.04,2.3,0.092,15,54,0.9970,3.26,0.65,9.8,5,2
11.2,0.280,0.56,1.9,0.075,17,60,0.9980,3.16,0.58,9.8,6,3
7.4,0.700,0.00,1.9,0.076,11,34,0.9978,3.51,0.56,9.4,5,4
7.4,0.660,0.00,1.8,0.075,13,40,0.9978,3.51,0.56,9.4,5,5
7.9,0.600,0.06,1.6,0.069,15,59,0.9964,3.30,0.46,9.4,5,6
7.3,0.650,0.00,1.2,0.065,15,21,0.9946,3.39,0.47,10.0,7,7
7.8,0.580,0.02,2.0,0.073,9,18,0.9968,3.36,0.57,9.5,7,8
6.7,0.580,0.08,1.8,0.097,15,65,0.9959,3.28,0.54,9.2,5,10


In [5]:
clean_data <- rename(data, snoring_rate = sr, 
                     respiration_rate = rr, body_temperature = t, limb_movements = lm, 
                     blood_oxygen_levels = bo, eye_movements = rem, hours_sleep = sr_1, 
                     heart_rate = hr, stress_level = sl)

In [19]:
clean_data_split <- initial_split(clean_data, prop = 0.5, strata = stress_level)
clean_data_train <- training(clean_data_split)
clean_data_test <- testing(clean_data_split)

In [20]:
clean_data_train <- clean_data_train

snoring_rate,respiration_rate,body_temperature,limb_movements,blood_oxygen_levels,eye_movements,hours_sleep,heart_rate,stress_level
<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>
60.000,20.000,96.000,10.000,95.000,85.00,7.000,60.00,1
47.000,16.800,97.200,5.600,95.800,68.00,7.800,52.00,0
50.000,18.000,99.000,8.000,97.000,80.00,9.000,55.00,0
55.520,19.104,95.104,9.104,93.656,82.76,6.104,57.76,1
73.440,21.344,93.344,11.344,91.344,91.72,4.016,63.36,2
96.288,26.288,85.360,17.144,82.432,100.36,0.000,75.72,4
52.640,18.528,94.528,8.528,92.792,81.32,5.528,56.32,1
81.560,22.416,90.208,12.520,88.208,95.52,0.208,66.04,3
89.960,24.656,91.328,15.320,89.328,98.32,1.328,71.64,3
53.680,18.736,94.736,8.736,93.104,81.84,5.736,56.84,1
