In [5]:
import pandas as pd
from sklearn.preprocessing import OneHotEncoder

# Read the dataset from disk and discard the 'Unnamed: 0' column in one pass
data_path = 'CleanData.csv'
data = pd.read_csv(data_path).drop(columns='Unnamed: 0')

# Parse 'Last Fight Date' into pandas datetime values
last_fight_dates = pd.to_datetime(data['Last Fight Date'])
data['Last Fight Date'] = last_fight_dates

# Standardize 'Height' values: the raw number packs feet and inches together
# (e.g. 511.0 means 5 ft 11 in) and is converted to total inches (71.0).
def convert_height_to_inches(height):
    """Convert a feet-and-inches encoded height into total inches.

    The encoding stores feet in the hundreds and inches in the remainder,
    so ``511.0`` is read as 5 feet 11 inches and becomes ``71.0``.

    Parameters
    ----------
    height : int or float
        Encoded height. Missing values (``None``, ``NaN``, ``pd.NA``) are
        accepted.

    Returns
    -------
    int or float
        Total inches (same numeric kind as the input), or ``NaN`` when the
        input is missing.
    """
    # int(NaN) raises ValueError, which would abort a whole Series.apply();
    # propagate missing heights as NaN instead.
    if pd.isna(height):
        return float('nan')
    feet = int(height / 100)   # hundreds and above hold the feet
    inches = height % 100      # remainder holds the inches
    return feet * 12 + inches

# Replace every encoded height with its value in total inches
height_in_inches = data['Height'].apply(convert_height_to_inches)
data['Height'] = height_in_inches

# One-hot encode 'Weight Class'
# The dense-output flag was renamed from `sparse` to `sparse_output` in
# scikit-learn 1.2 and the old spelling was removed in 1.4, so try the new
# keyword first and fall back to the old one on older releases.
try:
    encoder = OneHotEncoder(sparse_output=False)
except TypeError:
    encoder = OneHotEncoder(sparse=False)
weight_class_encoded = encoder.fit_transform(data[['Weight Class']])
weight_class_encoded_df = pd.DataFrame(
    weight_class_encoded,
    columns=encoder.get_feature_names_out(['Weight Class']),
    index=data.index,  # keep rows aligned with `data`; concat(axis=1) joins on the index
)

# Drop the original 'Weight Class' column and concatenate the new one-hot encoded columns
data = pd.concat([data.drop(columns='Weight Class'), weight_class_encoded_df], axis=1)

# Feature engineering: whole days elapsed since each row's last fight.
# NOTE: the reference point is the date the cell is run, so this column
# changes from one run day to the next.
reference_day = pd.Timestamp.now().normalize()  # current date at midnight
time_since_last_fight = reference_day - data['Last Fight Date']
data['Days Since Last Fight'] = time_since_last_fight.dt.days





In [10]:
# Load 'Results.csv' into a DataFrame
results = pd.read_csv(filepath_or_buffer='Results.csv')