In [1]:
# --- PART A: Model Building Script ---
import pandas as pd
import numpy as np
from sklearn.datasets import load_wine
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LogisticRegression
from sklearn.pipeline import Pipeline
from sklearn.metrics import accuracy_score, classification_report
import joblib
from google.colab import files

# 0. Configuration
# Tunable values are defined once here so the split, the solver budget and
# the output path cannot drift apart between the steps that use them.
TEST_SIZE = 0.2                          # fraction of rows held out for evaluation
RANDOM_STATE = 42                        # seed passed to train_test_split
MAX_ITER = 1000                          # iteration cap passed to LogisticRegression
MODEL_PATH = 'wine_cultivar_model.pkl'   # file written by joblib, then downloaded

# 1. Load Data
# load_wine() returns a bunch exposing .data, .feature_names, .target and
# .target_names; the features go into a DataFrame with the label appended.
data = load_wine()
df = pd.DataFrame(data.data, columns=data.feature_names)
df['target'] = data.target

# 2. Feature Selection (We pick 6 features as requested)
# Only these six columns are used as model inputs. The author chose them as
# chemically distinct predictors; that rationale is not validated in this cell.
selected_features = [
    'alcohol',
    'malic_acid',
    'ash',
    'alcalinity_of_ash',
    'magnesium',
    'color_intensity',
]

X = df[selected_features]
y = df['target']

# 3. Data Splitting
# stratify=y keeps each class's share roughly the same in the train and test
# subsets as in the full dataset (it does NOT make the classes equal-sized).
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=TEST_SIZE, random_state=RANDOM_STATE, stratify=y
)

# 4. Pipeline Construction
# Scaler and classifier are bundled so the scaler is fitted on the training
# rows only and the same transformation is re-applied at predict time. The
# saved artifact therefore accepts raw (unscaled) feature values.
pipeline = Pipeline([
    ('scaler', StandardScaler()),                            # Step 1: scale data
    ('classifier', LogisticRegression(max_iter=MAX_ITER)),   # Step 2: train model
])

# 5. Train
pipeline.fit(X_train, y_train)

# 6. Evaluate on the held-out split
y_pred = pipeline.predict(X_test)

print("--- Model Performance ---")
print(f"Accuracy: {accuracy_score(y_test, y_pred):.4f}")
print("\nClassification Report:")
print(classification_report(y_test, y_pred, target_names=data.target_names))

# 7. Save Model
# The whole fitted pipeline (scaler + classifier) is persisted as one object.
joblib.dump(pipeline, MODEL_PATH)
print(f"✅ Model saved as '{MODEL_PATH}'")

# 8. Download
# `files` comes from google.colab, so this step only works when the notebook
# is running inside Colab.
files.download(MODEL_PATH)

--- Model Performance ---
Accuracy: 0.9167

Classification Report:
              precision    recall  f1-score   support

     class_0       0.92      1.00      0.96        12
     class_1       0.93      0.93      0.93        14
     class_2       0.89      0.80      0.84        10

    accuracy                           0.92        36
   macro avg       0.91      0.91      0.91        36
weighted avg       0.92      0.92      0.92        36

✅ Model saved as 'wine_cultivar_model.pkl'


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>