In [1]:
import os
import numpy as np
import cv2
from sklearn.preprocessing import StandardScaler
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score
from sklearn.utils import shuffle

# Helper function to load and preprocess images
def load_images_from_directory(directory, label, image_size=(32, 32)):
    data = []
    labels = []
    for file in os.listdir(directory):
        file_path = os.path.join(directory, file)
        if os.path.isfile(file_path):
            image = cv2.imread(file_path, cv2.IMREAD_GRAYSCALE)
            image = cv2.resize(image, image_size)
            data.append(image.flatten())
            labels.append(label)
    return np.array(data), np.array(labels)

# Load and preprocess data
def preprocess_data():
    # Load training data
    train_cats, train_cats_labels = load_images_from_directory('train/cats', 0)
    train_dogs, train_dogs_labels = load_images_from_directory('train/dogs', 1)
    
    X_train = np.vstack((train_cats, train_dogs))
    y_train = np.hstack((train_cats_labels, train_dogs_labels))
    
    # Load test data
    test_cats, test_cats_labels = load_images_from_directory('test/cats', 0)
    test_dogs, test_dogs_labels = load_images_from_directory('test/dogs', 1)
    
    X_test = np.vstack((test_cats, test_dogs))
    y_test = np.hstack((test_cats_labels, test_dogs_labels))
    
    # Shuffle and scale the data
    X_train, y_train = shuffle(X_train, y_train, random_state=42)
    scaler = StandardScaler()
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)
    
    return X_train, y_train, X_test, y_test

# Load data
X_train, y_train, X_test, y_test = preprocess_data()


In [6]:
from sklearn.model_selection import GridSearchCV

param_grid = {'C': [0.1, 1, 10], 'kernel': ['linear', 'rbf'], 'gamma': ['scale', 'auto']}
grid = GridSearchCV(SVC(max_iter=5000), param_grid, cv=3, verbose=3)
grid.fit(X_train, y_train)

print(f"Best Parameters: {grid.best_params_}")
best_model = grid.best_estimator_


Fitting 3 folds for each of 12 candidates, totalling 36 fits




[CV 1/3] END .C=0.1, gamma=scale, kernel=linear;, score=0.521 total time=  36.0s




[CV 2/3] END .C=0.1, gamma=scale, kernel=linear;, score=0.501 total time=  33.6s




[CV 3/3] END .C=0.1, gamma=scale, kernel=linear;, score=0.511 total time=  33.4s




[CV 1/3] END ....C=0.1, gamma=scale, kernel=rbf;, score=0.582 total time= 1.6min




[CV 2/3] END ....C=0.1, gamma=scale, kernel=rbf;, score=0.586 total time= 1.5min




[CV 3/3] END ....C=0.1, gamma=scale, kernel=rbf;, score=0.586 total time= 1.5min




[CV 1/3] END ..C=0.1, gamma=auto, kernel=linear;, score=0.521 total time=  32.3s




[CV 2/3] END ..C=0.1, gamma=auto, kernel=linear;, score=0.501 total time=  31.8s




[CV 3/3] END ..C=0.1, gamma=auto, kernel=linear;, score=0.511 total time=  32.3s




[CV 1/3] END .....C=0.1, gamma=auto, kernel=rbf;, score=0.579 total time= 1.5min




[CV 2/3] END .....C=0.1, gamma=auto, kernel=rbf;, score=0.593 total time= 1.6min




[CV 3/3] END .....C=0.1, gamma=auto, kernel=rbf;, score=0.596 total time= 1.5min




[CV 1/3] END ...C=1, gamma=scale, kernel=linear;, score=0.509 total time=  30.4s




[CV 2/3] END ...C=1, gamma=scale, kernel=linear;, score=0.501 total time=  32.7s




[CV 3/3] END ...C=1, gamma=scale, kernel=linear;, score=0.493 total time=  32.0s




[CV 1/3] END ......C=1, gamma=scale, kernel=rbf;, score=0.659 total time= 1.6min




[CV 2/3] END ......C=1, gamma=scale, kernel=rbf;, score=0.645 total time= 1.5min




[CV 3/3] END ......C=1, gamma=scale, kernel=rbf;, score=0.639 total time= 1.6min




[CV 1/3] END ....C=1, gamma=auto, kernel=linear;, score=0.509 total time=  31.3s




[CV 2/3] END ....C=1, gamma=auto, kernel=linear;, score=0.501 total time=  31.0s




[CV 3/3] END ....C=1, gamma=auto, kernel=linear;, score=0.493 total time=  30.6s




[CV 1/3] END .......C=1, gamma=auto, kernel=rbf;, score=0.658 total time= 1.5min




[CV 2/3] END .......C=1, gamma=auto, kernel=rbf;, score=0.642 total time= 1.5min




[CV 3/3] END .......C=1, gamma=auto, kernel=rbf;, score=0.647 total time= 1.4min




[CV 1/3] END ..C=10, gamma=scale, kernel=linear;, score=0.524 total time=  30.6s




[CV 2/3] END ..C=10, gamma=scale, kernel=linear;, score=0.501 total time=  30.8s




[CV 3/3] END ..C=10, gamma=scale, kernel=linear;, score=0.513 total time=  29.9s




[CV 1/3] END .....C=10, gamma=scale, kernel=rbf;, score=0.637 total time= 1.3min




[CV 2/3] END .....C=10, gamma=scale, kernel=rbf;, score=0.629 total time= 1.3min




[CV 3/3] END .....C=10, gamma=scale, kernel=rbf;, score=0.628 total time= 1.4min




[CV 1/3] END ...C=10, gamma=auto, kernel=linear;, score=0.524 total time=  29.8s




[CV 2/3] END ...C=10, gamma=auto, kernel=linear;, score=0.501 total time=  30.9s




[CV 3/3] END ...C=10, gamma=auto, kernel=linear;, score=0.513 total time=  29.1s




[CV 1/3] END ......C=10, gamma=auto, kernel=rbf;, score=0.634 total time= 1.3min




[CV 2/3] END ......C=10, gamma=auto, kernel=rbf;, score=0.634 total time= 1.4min




[CV 3/3] END ......C=10, gamma=auto, kernel=rbf;, score=0.627 total time= 1.3min
Best Parameters: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




In [2]:
# Train SVM
print("Training optimized SVM model...")
svm = SVC(kernel='rbf', max_iter=50000, verbose=True,gamma='auto',C=1) 
svm.fit(X_train, y_train)

Training optimized SVM model...
[LibSVM]

In [3]:
# Evaluate on test data
y_test_pred = svm.predict(X_test)
test_accuracy = accuracy_score(y_test, y_test_pred)
print(f"Test Accuracy: {test_accuracy:.2f}")

Test Accuracy: 0.66
