# Préparation des variables commerce

In [1]:
library(tidyverse)
library(factoextra)

# Load the pilot data set
df_pilot1_2022 <- readRDS(
  "../../../data/qc2022/preparation_donnees/01_pilot1_2022.rds"
)

# Columns kept for the commerce variables: the "id" column plus every
# cons_brand_* and cons_coffee_* column listed below
variables_commerce <- c(
  "id",
  paste0(
    "cons_brand_",
    c("MaR", "BInd", "ChainesB", "GSurf", "OnlineOnly", "Frip", "Other")
  ),
  paste0(
    "cons_coffee_",
    c("TimH", "Starbucks", "SC", "McDo", "Other", "place_ind")
  )
)

# all_of() makes the selection fail loudly if a listed column is missing
df_commerce <- select(df_pilot1_2022, all_of(variables_commerce))

-- [1mAttaching core tidyverse packages[22m ------------------------ tidyverse 2.0.0 --
[32mv[39m [34mdplyr    [39m 1.1.4     [32mv[39m [34mreadr    [39m 2.1.5
[32mv[39m [34mforcats  [39m 1.0.0     [32mv[39m [34mstringr  [39m 1.5.1
[32mv[39m [34mggplot2  [39m 3.5.1     [32mv[39m [34mtibble   [39m 3.2.1
[32mv[39m [34mlubridate[39m 1.9.3     [32mv[39m [34mtidyr    [39m 1.3.1
[32mv[39m [34mpurrr    [39m 1.0.2     
-- [1mConflicts[22m ------------------------------------------ tidyverse_conflicts() --
[31mx[39m [34mdplyr[39m::[32mfilter()[39m masks [34mstats[39m::filter()
[31mx[39m [34mdplyr[39m::[32mlag()[39m    masks [34mstats[39m::lag()
[36mi[39m Use the conflicted package ([3m[34m<http://conflicted.r-lib.org/>[39m[23m) to force all conflicts to become errors
Welcome! Want to learn more? See two factoextra-related books at https://goo.gl/ve3WBa



In [3]:
# Print the frequency table of every commerce variable; the "id" column is
# skipped.
# useNA = "ifany" adds an NA count whenever a variable has missing values,
# which table() would otherwise drop silently.
for (v in setdiff(variables_commerce, "id")) {
  cat("Table pour la variable:", v, "\n")
  print(table(df_commerce[[v]], useNA = "ifany"))
  cat("\n\n")
}

Table pour la variable: cons_brand_MaR 

   0    1 
1093  407 


Table pour la variable: cons_brand_BInd 

   0    1 
1369  131 


Table pour la variable: cons_brand_ChainesB 

   0    1 
1173  327 


Table pour la variable: cons_brand_GSurf 

   0    1 
1111  389 


Table pour la variable: cons_brand_OnlineOnly 

   0    1 
1414   86 


Table pour la variable: cons_brand_Frip 

   0    1 
1390  110 


Table pour la variable: cons_brand_Other 

   0    1 
1450   50 


Table pour la variable: cons_coffee_TimH 

   0    1 
1147  353 


Table pour la variable: cons_coffee_Starbucks 

   0    1 
1387  113 


Table pour la variable: cons_coffee_SC 

   0    1 
1492    8 


Table pour la variable: cons_coffee_McDo 

   0    1 
1330  170 


Table pour la variable: cons_coffee_Other 

   0    1 
1476   24 


Table pour la variable: cons_coffee_place_ind 

   0    1 
1404   96 




### Transformations

- cons_brand : Aucun changement

- cons_coffee : Regrouper SC (Second Cup, seulement 8 répondants) avec Other

In [4]:
# Regrouping of cons_coffee ----

# Step 1: rows flagged cons_coffee_SC == 1 are counted under
# cons_coffee_Other; every other row keeps its current cons_coffee_Other value
df_commerce <- mutate(
  df_commerce,
  cons_coffee_Other = if_else(
    condition = cons_coffee_SC == 1,
    true = 1,
    false = cons_coffee_Other
  )
)

# Step 2: the SC column is now folded into Other, so drop it
df_commerce <- select(df_commerce, -cons_coffee_SC)

In [7]:
# Column names after the regrouping: "id", the cons_brand_* columns and the
# cons_coffee_* columns (cons_coffee_SC is no longer listed)
variables_commerce_clust <- c(
  "id",
  paste0(
    "cons_brand_",
    c("MaR", "BInd", "ChainesB", "GSurf", "OnlineOnly", "Frip", "Other")
  ),
  paste0(
    "cons_coffee_",
    c("TimH", "Starbucks", "McDo", "Other", "place_ind")
  )
)

In [8]:
# Print the frequency table of every variable in variables_commerce_clust;
# the "id" column is skipped.
# useNA = "ifany" adds an NA count whenever a variable has missing values,
# which table() would otherwise drop silently. This matters here because
# if_else() returns NA wherever its condition is NA.
for (v in setdiff(variables_commerce_clust, "id")) {
  cat("Table pour la variable:", v, "\n")
  print(table(df_commerce[[v]], useNA = "ifany"))
  cat("\n\n")
}

Table pour la variable: cons_brand_MaR 

   0    1 
1093  407 


Table pour la variable: cons_brand_BInd 

   0    1 
1369  131 


Table pour la variable: cons_brand_ChainesB 

   0    1 
1173  327 


Table pour la variable: cons_brand_GSurf 

   0    1 
1111  389 


Table pour la variable: cons_brand_OnlineOnly 

   0    1 
1414   86 


Table pour la variable: cons_brand_Frip 

   0    1 
1390  110 


Table pour la variable: cons_brand_Other 

   0    1 
1450   50 


Table pour la variable: cons_coffee_TimH 

   0    1 
1147  353 


Table pour la variable: cons_coffee_Starbucks 

   0    1 
1387  113 


Table pour la variable: cons_coffee_McDo 

   0    1 
1330  170 


Table pour la variable: cons_coffee_Other 

   0    1 
1468   32 


Table pour la variable: cons_coffee_place_ind 

   0    1 
1404   96 




In [9]:
# Write the prepared commerce data to disk
saveRDS(
  object = df_commerce,
  file = "../../../data/qc2022/preparation_donnees/02_pilot1_2022_commerce.rds"
)