In [2]:
import pandas as pd
from sklearn.preprocessing import OneHotEncoder

In [3]:
# Toy employee records, laid out column-wise: each key is a column name and
# each list holds that column's values (all lists have the same length).
data = {
    'Employee_id': [10, 20, 15, 25, 30],
    'Gender': ['M', 'F', 'F', 'M', 'F'],
    'Remarks': ['Good', 'Nice', 'Good', 'Great', 'Nice'],
}

# Build the DataFrame from the dict; no index is given, so pandas assigns
# the default integer row labels.
df = pd.DataFrame(data=data)

# Show the whole (tiny) frame under a short heading.
print("Employee data : \n" + str(df))

Employee data : 
   Employee_id Gender Remarks
0           10      M    Good
1           20      F    Nice
2           15      F    Good
3           25      M   Great
4           30      F    Nice


In [6]:
# One-hot encode the categorical columns of `df`, keeping every other column
# unchanged, and store the result in `df_encoded`.

# Select the categorical columns by dtype. Besides plain `object` columns,
# also pick up columns stored with pandas' dedicated `string` and `category`
# dtypes, which `include=['object']` alone would skip.
categorical_columns = df.select_dtypes(
    include=['object', 'string', 'category']
).columns.tolist()

# sparse_output=False makes the encoder return a dense NumPy array, which can
# be wrapped in a DataFrame directly.
encoder = OneHotEncoder(sparse_output=False)

# Learn the categories of each selected column and encode them in one step.
one_hot_encoded = encoder.fit_transform(df[categorical_columns])

# Wrap the encoded array in a DataFrame:
#   * column names come from get_feature_names_out ("<column>_<category>");
#   * the index is copied from `df` so the rows line up label-for-label.
#     Without it the new frame would get a fresh 0..n-1 index, and the
#     index-aligned concat below would produce NaN-padded rows whenever `df`
#     does not carry the default index (e.g. after filtering or sorting).
one_hot_df = pd.DataFrame(
    one_hot_encoded,
    columns=encoder.get_feature_names_out(categorical_columns),
    index=df.index,
)

# Replace the original categorical columns with their one-hot counterparts:
# drop them from a copy of `df` and append the encoded columns side by side.
df_encoded = pd.concat(
    [df.drop(columns=categorical_columns), one_hot_df],
    axis=1,
)

# print the resulting dataframe
print(f"Encoded data : \n{df_encoded}")

Encoded data : 
   Employee_id  Gender_F  Gender_M  Remarks_Good  Remarks_Great  Remarks_Nice
0           10       0.0       1.0           1.0            0.0           0.0
1           20       1.0       0.0           0.0            0.0           1.0
2           15       1.0       0.0           1.0            0.0           0.0
3           25       0.0       1.0           0.0            1.0           0.0
4           30       1.0       0.0           0.0            0.0           1.0
