## One-hot encoding
#### For categorical features with 3 or more categories
#### Transforms each such feature into multiple features with binary values

In [None]:
import pandas as pd

# One-hot encoding using Pandas
# We will just count how many different values there are in each categorical variable and consider only the variables with 3 or more values
# One-hot encoding aims to transform a categorical variable with n outputs into n binary variables.

# If a feature has only two categories, it can stay a single feature with binary values

# Load the raw dataset from the CSV file in the current working directory.
df = pd.read_csv("heart.csv")

# Names of the categorical columns that get expanded into indicator columns.
# NOTE(review): every column listed here is encoded, regardless of how many
# distinct values it holds -- confirm that is intended for two-valued columns.
cat_variables = [
    'Sex',
    'ChestPainType',
    'RestingECG',
    'ExerciseAngina',
    'ST_Slope',
]

# One-hot encode with pandas' built-in helper:
#   - first argument: the DataFrame to transform
#   - columns: the columns to encode; each is replaced by its indicator
#     columns, while columns not listed are left untouched
#   - prefix: one prefix per encoded column (must match 'columns' in length),
#     so every generated column name shows which original column it came from
df = pd.get_dummies(df, columns=cat_variables, prefix=cat_variables)