# SVM after data pre-processing and with balanced sampling

In [35]:
import numpy as np
import os
import cv2
from sklearn import svm
from sklearn.metrics import classification_report
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder, StandardScaler

In [36]:
# root directory of the dataset; the loading loop treats each of its
# subfolders as one class
data_folder = "C:/Users/praveena/Downloads/archive (4)/data/"

In [37]:
# accumulators filled in parallel by the loading loop:
# data[i] is an image and labels[i] is its class label
data, labels = [], []

In [38]:
# common size every image is resized to, so that all samples end up
# with the same number of features after flattening
image_size = 64, 64

In [39]:
# Walk every class subfolder of data_folder and load its .jpg images.
# The subfolder name is used as the class label of each image inside it.
# Directory listings are sorted because os.listdir returns entries in
# arbitrary order, which would otherwise make the later seeded
# train/test split differ between machines and runs.
for folder in sorted(os.listdir(data_folder)):
    folder_path = os.path.join(data_folder, folder)
    if not os.path.isdir(folder_path):
        continue  # plain files next to the class folders carry no label
    for filename in sorted(os.listdir(folder_path)):
        if not filename.endswith('.jpg'):
            continue
        image_path = os.path.join(folder_path, filename)
        image = cv2.imread(image_path)
        if image is None:
            # cv2.imread reports an unreadable or corrupt file by returning
            # None instead of raising; passing that on to cv2.resize would
            # abort the whole load, so the file is reported and skipped.
            print("Skipping unreadable image:", image_path)
            continue
        # data and labels are appended together so they stay index-aligned
        data.append(cv2.resize(image, image_size))
        labels.append(folder)

In [42]:
# turn the Python lists into numpy arrays (one entry per image along the
# first axis) so they can be split and reshaped below
data, labels = np.array(data), np.array(labels)

In [43]:
# map the folder-name labels to integer class ids; the fitted encoder is
# kept so the ids can be translated back to names later
label_encoder = LabelEncoder().fit(labels)
labels = label_encoder.transform(labels)

In [44]:
# hold out 20% of the samples for testing; the fixed seed keeps the
# shuffling repeatable for the same input order
X_train, X_test, y_train, y_test = train_test_split(
    data,
    labels,
    test_size=0.2,
    random_state=42,
)

In [45]:
# collapse every image into one feature vector:
# image_size[0] * image_size[1] pixels with 3 values per pixel
num_pixels = 3 * np.prod(image_size)
X_train = X_train.reshape(len(X_train), num_pixels)
X_test = X_test.reshape(len(X_test), num_pixels)

In [46]:
# standardize the features; the scaler is fitted on the training set only
# and the same fitted transformation is then applied to both sets
scaler = StandardScaler().fit(X_train)
X_train = scaler.transform(X_train)
X_test = scaler.transform(X_test)

In [47]:
# train a linear-kernel support vector classifier on the scaled training data
clf = svm.SVC(kernel='linear').fit(X_train, y_train)

In [48]:
# predicted class ids for the held-out test samples
y_pred = clf.predict(X=X_test)

In [50]:
from sklearn.metrics import accuracy_score
from sklearn.metrics import precision_score, recall_score, f1_score

In [51]:
# overall accuracy, plus macro-averaged precision / recall / F1 on the test set
accuracy = accuracy_score(y_test, y_pred)
precision, recall, f1 = (
    metric(y_test, y_pred, average='macro')
    for metric in (precision_score, recall_score, f1_score)
)

In [52]:
# report the accuracy computed from the test-set predictions
print("Accuracy:", accuracy)

Accuracy: 0.7958333333333333


In [53]:
# report the macro-averaged precision computed from the test-set predictions
print("Precision:", precision)

Precision: 0.8123384446219415


In [54]:
# report the macro-averaged recall computed from the test-set predictions
print("Recall:", recall)

Recall: 0.7928830015900741


In [55]:
# report the macro-averaged F1 score computed from the test-set predictions
print("F1-score:", f1)

F1-score: 0.7860385633443893
