In [29]:
import numpy as np
import pandas as pd
from sklearn import datasets
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.metrics import log_loss,accuracy_score,roc_auc_score

In [30]:
# Two-stage estimator: standardize the features, then fit a logistic
# regression on the scaled values. Step names ("scaler", "model") are the
# keys used to address each stage of the pipeline.
pipe = Pipeline(
    steps=[
        ("scaler", StandardScaler()),
        (
            "model",
            LogisticRegression(
                penalty="l2",    # L2 regularization ...
                C=1.0,           # ... with inverse regularization strength 1.0
                solver="lbfgs",
                max_iter=10000,  # generous iteration cap for the solver
            ),
        ),
    ]
)

In [31]:
# Load scikit-learn's bundled breast cancer dataset. Note that `df` is the
# dataset container returned by the loader (exposing .data, .feature_names
# and .target), not a pandas DataFrame; the frame itself is built just below.
df = datasets.load_breast_cancer()

# Feature matrix as a DataFrame with named columns, plus the target labels.
x = pd.DataFrame(df.data, columns=df.feature_names)
y = df.target

# Hold out 20% of the rows for testing. The split is stratified on the
# labels and seeded so it is reproducible.
#   X, Y     -> training features / labels
#   X_T, Y_T -> test features / labels
X, X_T, Y, Y_T = train_test_split(
    x,
    y,
    test_size=0.2,
    stratify=y,
    random_state=42,
)

In [32]:
# Fit the whole pipeline (scaler + model) on the training partition only.
pipe.fit(X, Y)

# Predictions on the held-out partition: hard labels for accuracy, and
# column 1 of predict_proba (the second class in the model's class ordering)
# for the probability-based metrics.
y_pred = pipe.predict(X_T)
y_prob = pipe.predict_proba(X_T)[:, 1]

# Report each metric in turn; every score is computed right before it is
# printed, against the true test labels Y_T.
for label, metric, estimate in (
    ("Accuracy :", accuracy_score, y_pred),
    ("Log loss :", log_loss, y_prob),
    ("ROC AUC  :", roc_auc_score, y_prob),
):
    print(label, metric(Y_T, estimate))

Accuracy : 0.9824561403508771
Log loss : 0.07774649384096742
ROC AUC  : 0.9953703703703703


