# Audio Defect Classification using Logistic Regression

This notebook trains a one-vs-rest Logistic Regression model to classify audio defects, evaluates it on a held-out test split, and saves the fitted model to disk.

In [None]:
import numpy as np
import pandas as pd
from sklearn.linear_model import LogisticRegression
from sklearn.multiclass import OneVsRestClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, accuracy_score
import joblib
import sys
sys.path.append('..')
from utils.defect_utils import preprocess_data

In [None]:
# Read the raw dataset from disk and hand it to the project helper, which
# returns the model inputs (X) and targets (y).
# NOTE(review): the exact shape/encoding of X and y is decided inside
# utils.defect_utils.preprocess_data -- check there before changing the model.
dataset_path = '../data/dataset.csv'
df = pd.read_csv(dataset_path)
X, y = preprocess_data(df)

In [None]:
# Hold out 20% of the samples for evaluation; the fixed seed keeps the
# train/test partition reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

In [None]:
# Build the classifier: a logistic-regression base estimator (iteration cap
# raised to 1000) wrapped in a one-vs-rest strategy, intended here for
# multi-label classification.
base_estimator = LogisticRegression(max_iter=1000)
log_model = OneVsRestClassifier(base_estimator)

# Fit on the training split only; the test split stays untouched until
# evaluation.
log_model.fit(X_train, y_train)

In [None]:
# Score the fitted model on the held-out test split.
y_pred = log_model.predict(X_test)

# Per-label precision / recall / F1 summary.
print(classification_report(y_test, y_pred))

# NOTE(review): if y is a multi-label indicator matrix, accuracy_score reports
# subset (exact-match) accuracy rather than per-label accuracy -- confirm this
# is the metric you want to track.
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")

In [None]:
# Save model
# Persist the fitted classifier with joblib so it can be reloaded later
# without retraining.
import os

model_path = '../models/logistic_defect.pkl'

# joblib.dump does not create missing parent directories; make sure the
# target folder exists so a fresh checkout does not fail after training.
os.makedirs(os.path.dirname(model_path), exist_ok=True)

joblib.dump(log_model, model_path)