## 实现混淆矩阵、精准率与召回率

In [31]:
import numpy as np
from sklearn.datasets import load_digits

In [32]:
# Load the digits dataset and turn it into a skewed binary problem:
# the positive class (1) is "digit is 9", everything else is negative (0).
digits = load_digits()
X = digits.data

# Build the 0/1 target in one vectorised step; casting the boolean mask back
# to the dtype of digits.target keeps the same dtype the in-place version had.
y = (digits.target == 9).astype(digits.target.dtype)

In [33]:
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression

In [34]:
# Split the data into train/test parts (seeded with random_state=666 so the
# split is reproducible), then fit a LogisticRegression built with its default
# arguments on the training part. The fit call is the cell's last expression,
# so the notebook displays the fitted estimator.
X_train,X_test,y_train,y_test = train_test_split(X,y,random_state=666)
log_reg = LogisticRegression()
log_reg.fit(X_train,y_train)



LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,
                   intercept_scaling=1, l1_ratio=None, max_iter=100,
                   multi_class='warn', n_jobs=None, penalty='l2',
                   random_state=None, solver='warn', tol=0.0001, verbose=0,
                   warm_start=False)

In [35]:
# Print the fitted model's score on the held-out test split.
print(log_reg.score(X_test,y_test))

0.9755555555555555


In [36]:
def TN(true_res, predict_res):
    """Count true negatives: samples labelled 0 that were also predicted 0.

    Args:
        true_res: Ground-truth binary labels (0/1); any array-like.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The number of positions where both the label and the prediction
        are 0 (a NumPy integer).

    Raises:
        AssertionError: If the two inputs differ in length.
    """
    assert len(true_res) == len(predict_res)
    # Coerce to arrays so plain lists/tuples are compared element-wise; a bare
    # ``list == 0`` is a single False and would silently give a count of 0.
    true_res = np.asarray(true_res)
    predict_res = np.asarray(predict_res)
    return np.sum((true_res == 0) & (predict_res == 0))
def FN(true_res, predict_res):
    """Count false negatives: samples labelled 1 that were predicted 0.

    Args:
        true_res: Ground-truth binary labels (0/1); any array-like.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The number of positions where the label is 1 but the prediction
        is 0 (a NumPy integer).

    Raises:
        AssertionError: If the two inputs differ in length.
    """
    assert len(true_res) == len(predict_res)
    # Coerce to arrays so plain lists/tuples are compared element-wise; a bare
    # ``list == 1`` is a single False and would silently give a count of 0.
    true_res = np.asarray(true_res)
    predict_res = np.asarray(predict_res)
    return np.sum((true_res == 1) & (predict_res == 0))
def FP(true_res, predict_res):
    """Count false positives: samples labelled 0 that were predicted 1.

    Args:
        true_res: Ground-truth binary labels (0/1); any array-like.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The number of positions where the label is 0 but the prediction
        is 1 (a NumPy integer).

    Raises:
        AssertionError: If the two inputs differ in length.
    """
    assert len(true_res) == len(predict_res)
    # Coerce to arrays so plain lists/tuples are compared element-wise; a bare
    # ``list == 0`` is a single False and would silently give a count of 0.
    true_res = np.asarray(true_res)
    predict_res = np.asarray(predict_res)
    return np.sum((true_res == 0) & (predict_res == 1))
def TP(true_res, predict_res):
    """Count true positives: samples labelled 1 that were also predicted 1.

    Args:
        true_res: Ground-truth binary labels (0/1); any array-like.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The number of positions where both the label and the prediction
        are 1 (a NumPy integer).

    Raises:
        AssertionError: If the two inputs differ in length.
    """
    assert len(true_res) == len(predict_res)
    # Coerce to arrays so plain lists/tuples are compared element-wise; a bare
    # ``list == 1`` is a single False and would silently give a count of 0.
    true_res = np.asarray(true_res)
    predict_res = np.asarray(predict_res)
    return np.sum((true_res == 1) & (predict_res == 1))

In [37]:
def confusion_matrix(true_res, predict_res):
    """Assemble the 2x2 confusion matrix for binary labels.

    The layout is ``[[TN, FP], [FN, TP]]``: the first row holds the counts
    for samples whose true label is 0, the second row those whose true
    label is 1; the first column is "predicted 0", the second "predicted 1".

    Args:
        true_res: Ground-truth binary labels.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        A 2x2 NumPy array of counts.
    """
    actual_negative_row = [TN(true_res, predict_res), FP(true_res, predict_res)]
    actual_positive_row = [FN(true_res, predict_res), TP(true_res, predict_res)]
    return np.array([actual_negative_row, actual_positive_row])
def precise_rate(true_res, predict_res):
    """Return the precision, TP / (TP + FP), of binary predictions.

    Args:
        true_res: Ground-truth binary labels.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The fraction of predicted positives that are truly positive, or
        ``0.0`` when nothing was predicted positive (TP + FP == 0).
    """
    tp = TP(true_res, predict_res)
    fp = FP(true_res, predict_res)
    predicted_positive = tp + fp
    # TP/FP return NumPy integers (results of np.sum). Dividing those by zero
    # yields nan with a RuntimeWarning instead of raising ZeroDivisionError,
    # so the empty-denominator case must be tested explicitly.
    if predicted_positive == 0:
        return 0.0
    return tp / predicted_positive
def recall_rate(true_res, predict_res):
    """Return the recall, TP / (TP + FN), of binary predictions.

    Args:
        true_res: Ground-truth binary labels.
        predict_res: Predicted binary labels, same length as ``true_res``.

    Returns:
        The fraction of truly positive samples that were predicted positive,
        or ``0.0`` when there are no positive samples (TP + FN == 0).
    """
    tp = TP(true_res, predict_res)
    fn = FN(true_res, predict_res)
    actual_positive = tp + fn
    # TP/FN return NumPy integers (results of np.sum). Dividing those by zero
    # yields nan with a RuntimeWarning instead of raising ZeroDivisionError,
    # so the empty-denominator case must be tested explicitly.
    if actual_positive == 0:
        return 0.0
    return tp / actual_positive

In [38]:
# Predict on the held-out split and report the hand-written metrics:
# confusion matrix, precision and recall, one per line.
y_predict = log_reg.predict(X_test)
print(
    confusion_matrix(y_test, y_predict),
    precise_rate(y_test, y_predict),
    recall_rate(y_test, y_predict),
    sep="\n",
)

[[403   2]
 [  9  36]]
0.9473684210526315
0.8


In [39]:
from sklearn.metrics import confusion_matrix
from sklearn.metrics import recall_score
from sklearn.metrics import precision_score

In [42]:
# Report the same three metrics with the scikit-learn implementations
# imported in the previous cell, one per line, for comparison.
print(
    confusion_matrix(y_test, y_predict),
    precision_score(y_test, y_predict),
    recall_score(y_test, y_predict),
    sep="\n",
)

[[403   2]
 [  9  36]]
0.9473684210526315
0.8
