In [6]:
# Importing the necessary libraries
import pandas as pd
import numpy as np  # the importable module name is lowercase 'numpy', not 'NumPy'
from sklearn.compose import ColumnTransformer
from sklearn.preprocessing import OneHotEncoder, LabelEncoder

In [7]:
# Read the Titanic passenger records from the CSV file into a DataFrame.
dataset = pd.read_csv('Titanic-Dataset.csv')

# Columns treated as categorical; this list is what gets handed to the
# one-hot encoder in the ColumnTransformer cell.
categorical_features = [
    'Sex',
    'Embarked',
    'Pclass',
]

In [8]:
# Build the feature matrix X: one-hot encode the categorical columns and pass
# every remaining feature column through unchanged. The one-hot columns come
# first in the output; passthrough columns are appended on the right.
column_transformer = ColumnTransformer(
    transformers=[
        ('encoder', OneHotEncoder(), categorical_features)
    ],
    remainder='passthrough',
    # Always stack the result densely so that np.array(X) below receives a
    # regular 2-D array instead of wrapping a SciPy sparse matrix.
    sparse_threshold=0
)

# 'Survived' is the dependent variable (it is encoded separately as y).
# With remainder='passthrough' it would otherwise be copied into X and leak
# the target into the features, so it is removed before transforming.
features = dataset.drop(columns=['Survived'])

# Fit the encoder on the feature columns and transform them in one step
X = column_transformer.fit_transform(features)

# Convert the output into a NumPy array
X = np.array(X)

In [9]:
# Encode the dependent variable: the 'Survived' column is mapped to integer
# class labels with a LabelEncoder. The fitted encoder is kept in
# `label_encoder` so the learned classes remain available afterwards.
label_encoder = LabelEncoder()
y = label_encoder.fit(dataset['Survived']).transform(dataset['Survived'])

In [10]:
# Show the encoded features and the encoded target, each under its own
# heading (heading and value are separated by a newline).
print("Encoded Feature Matrix (X):", X, sep="\n")
print("\nEncoded Dependent Variable Vector (y):", y, sep="\n")

Encoded Feature Matrix (X):
[[0.0 1.0 0.0 ... 'A/5 21171' 7.25 nan]
 [1.0 0.0 1.0 ... 'PC 17599' 71.2833 'C85']
 [1.0 0.0 0.0 ... 'STON/O2. 3101282' 7.925 nan]
 ...
 [1.0 0.0 0.0 ... 'W./C. 6607' 23.45 nan]
 [0.0 1.0 1.0 ... '111369' 30.0 'C148']
 [0.0 1.0 0.0 ... '370376' 7.75 nan]]

Encoded Dependent Variable Vector (y):
[0 1 1 1 0 0 0 0 1 1 1 1 0 0 0 1 0 1 0 1 0 1 1 1 0 1 0 0 1 0 0 1 1 0 0 0 1
 0 0 1 0 0 0 1 1 0 0 1 0 0 0 0 1 1 0 1 1 0 1 0 0 1 0 0 0 1 1 0 1 0 0 0 0 0
 1 0 0 0 1 1 0 1 1 0 1 1 0 0 1 0 0 0 0 0 0 0 0 1 1 0 0 0 0 0 0 0 1 1 0 1 0
 0 0 0 0 0 0 0 0 0 0 0 0 1 0 1 0 1 1 0 0 0 0 1 0 0 1 0 0 0 0 1 1 0 0 0 1 0
 0 0 0 1 0 0 0 0 1 0 0 0 0 1 0 0 0 1 1 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 1
 0 1 1 0 0 1 0 1 1 1 1 0 0 1 0 0 0 0 0 1 0 0 1 1 1 0 1 0 0 0 1 1 0 1 0 1 0
 0 0 1 0 1 0 0 0 1 0 0 1 0 0 0 1 0 0 0 1 0 0 0 0 0 1 1 0 0 0 0 0 0 1 1 1 1
 1 0 1 0 0 0 0 0 1 1 1 0 1 1 0 1 1 0 0 0 1 0 0 0 1 0 0 1 0 1 1 1 1 0 0 0 0
 0 0 1 1 1 1 0 1 0 1 1 1 0 1 1 1 0 0 0 1 1 0 1 1 0 0 1 1 0 1 0 1 1 1 1 0 0
