# Support Vector Regression


In [2]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.svm import SVR
from sklearn.metrics import mean_squared_error

# Load the dataset
data = pd.read_csv("vehicles_dataset_from_advertisement.csv")

# Drop rows with missing values
data = data.dropna()

# Select features and target variable
X = data[['model_year', 'odometer', 'condition', 'cylinders', 'fuel', 'transmission', 'type', 'paint_color']]
y = data['price']

# Perform one-hot encoding for categorical features
X = pd.get_dummies(X)

# Standardize features
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)

# Train-test split
X_train, X_test, y_train, y_test = train_test_split(X_scaled, y, test_size=0.2, random_state=42)

# Instantiate the SVR model
svr_model = SVR()

# Train the model
svr_model.fit(X_train, y_train)

# Make predictions
y_train_pred = svr_model.predict(X_train)
y_test_pred = svr_model.predict(X_test)

# Calculate Mean Squared Error
train_loss = mean_squared_error(y_train, y_train_pred)
test_loss = mean_squared_error(y_test, y_test_pred)

print("Train Loss:", train_loss)
print("Test Loss:", test_loss)


Train Loss: 129060095.99088883
Test Loss: 133831685.37310076
