Title: Popular Classification Algorithms

Support Vector Machines (SVM)

Task 1: Identify handwriting on checks and classify each handwritten character (here, the digits 0–9 from scikit-learn's built-in digits dataset).

In [1]:
from sklearn import datasets
from sklearn.model_selection import train_test_split
from sklearn.svm import SVC

# Load scikit-learn's bundled digits dataset and pull out features and labels.
digits = datasets.load_digits()
X, y = digits.data, digits.target

# Hold out 20% of the samples for testing; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Train an SVM with default settings (fit() returns the estimator itself),
# then predict a label for every held-out sample.
model = SVC().fit(X_train, y_train)
predictions = model.predict(X_test)

print("Predicted digits:", predictions)


Predicted digits: [6 9 3 7 2 1 5 2 5 2 1 9 4 0 4 2 3 7 8 8 4 3 9 7 5 6 3 5 6 3 4 9 1 4 4 6 9
 4 7 6 6 9 1 3 6 1 3 0 6 5 5 1 9 5 6 0 9 0 0 1 0 4 5 2 4 5 7 0 7 5 9 5 5 4
 7 0 4 5 5 9 9 0 2 3 8 0 6 4 4 9 1 2 8 3 5 2 9 0 4 4 4 3 5 3 1 3 5 9 4 2 7
 7 4 4 1 9 2 7 9 7 2 6 9 4 0 7 2 7 5 8 7 5 7 9 0 6 6 4 2 8 0 9 4 6 9 9 6 9
 0 3 5 6 6 0 6 4 3 9 3 7 7 2 9 0 4 5 3 6 5 9 9 8 4 2 1 3 7 7 2 2 3 9 8 0 3
 2 2 5 6 9 9 4 1 5 4 2 3 6 4 8 5 9 5 7 8 9 4 8 1 5 4 4 9 6 1 8 6 0 4 5 2 7
 4 6 4 5 6 0 3 2 3 6 7 1 5 1 4 7 6 8 8 5 5 1 6 2 8 8 9 5 7 6 2 2 2 3 4 8 8
 3 6 0 9 7 7 0 1 0 4 5 1 5 3 6 0 4 1 0 0 3 6 5 9 7 3 5 5 9 9 8 5 3 3 2 0 5
 8 3 4 0 2 4 6 4 3 4 5 0 5 2 1 3 1 4 1 1 7 0 1 5 2 1 2 8 7 0 6 4 8 8 5 1 8
 4 5 8 7 9 8 6 0 6 2 0 7 9 8 9 5 2 7 7 1 8 7 4 3 8 3 5]



Task 2: Detect gender of a speaker based on voice data.

In [2]:
from sklearn.model_selection import train_test_split
from sklearn.svm import SVC
import pandas as pd

# Tiny hand-written sample: two numeric voice features plus a binary label.
# NOTE(review): the notebook does not say which of 0/1 maps to which gender.
data = pd.DataFrame(
    {
        'MeanFreq': [0.15, 0.20, 0.13, 0.25, 0.18, 0.22, 0.14, 0.24, 0.19, 0.23],
        'SD': [0.02, 0.03, 0.015, 0.035, 0.025, 0.028, 0.018, 0.032, 0.027, 0.030],
        'Gender': [1, 0, 1, 0, 1, 0, 1, 0, 1, 0],
    }
)

# Separate the feature columns from the target column.
feature_columns = ['MeanFreq', 'SD']
X = data[feature_columns]
y = data['Gender']

# Hold out 20% of the rows (2 of 10) for testing; the seed fixes the split.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Train an SVM with default settings and predict the held-out rows.
model = SVC().fit(X_train, y_train)
predictions = model.predict(X_test)

print("Predicted genders:", predictions)

Predicted genders: [1 0]


Task 3: Classify email topics based on content.

In [3]:
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.model_selection import train_test_split
from sklearn.svm import SVC

# Small hand-labelled corpus: one short text per email.
emails = [
    "Meeting scheduled for project updates",
    "Limited time offer on electronics",
    "Team outing next Friday",
    "Your invoice for last month",
    "Flash sale on shoes today",
    "Let's discuss the new marketing strategy",
    "Discounts available on your favorite brands",
    "Submit your report by Monday",
    "Huge savings on home appliances",
    "Client feedback received",
]
# One integer topic id per email, aligned by position with `emails`.
# NOTE(review): the meaning of each id (0/1/2) is not stated in the notebook.
labels = [0, 1, 0, 2, 1, 0, 1, 0, 1, 2]
y = labels

# Split the raw text BEFORE vectorizing. Fitting TF-IDF on the full corpus
# would let the held-out emails influence the vocabulary and IDF weights the
# model is trained with (data leakage).
emails_train, emails_test, y_train, y_test = train_test_split(
    emails,
    y,
    test_size=0.2,
    random_state=42,
)

# Learn vocabulary and IDF weights from the training emails only, then reuse
# that fitted vectorizer to encode the held-out emails.
vectorizer = TfidfVectorizer()
X_train = vectorizer.fit_transform(emails_train)
X_test = vectorizer.transform(emails_test)

# Keep `X` defined as the TF-IDF matrix for the whole corpus (encoded with the
# train-fitted vectorizer) so any code that still refers to `X` keeps working.
X = vectorizer.transform(emails)

# Train an SVM with default settings and predict the held-out emails.
model = SVC()
model.fit(X_train, y_train)
predictions = model.predict(X_test)

print("Predicted email topics:", predictions)

Predicted email topics: [0 0]
