### 实现混淆矩阵，并计算精准率和召回率

In [1]:
import numpy as np
import sklearn.datasets as datasets

In [8]:
# Load the dataset returned by datasets.load_digits(); X is the feature matrix.
digits = datasets.load_digits()
X = digits.data

# Binary target: 1 where the original label is the digit 9, 0 everywhere else.
# Casting the boolean mask back to the label dtype yields a fresh array, so
# digits.target itself is left untouched.
y = (digits.target == 9).astype(digits.target.dtype)

In [9]:
from sklearn.model_selection import train_test_split

# Hold out a test split with train_test_split's default proportions;
# random_state is pinned so the same split is produced on every run.
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=666)

In [10]:
from sklearn.linear_model import LogisticRegression

# Fit a logistic-regression classifier with default hyperparameters on the
# training split.
lr = LogisticRegression()
lr.fit(X_train, y_train)
# Last expression of the cell: the estimator's built-in score on the held-out
# split (for scikit-learn classifiers this is accuracy — see the library docs).
lr.score(X_test, y_test)



0.9755555555555555

In [12]:
# Predicted labels for the held-out split; reused by every metric cell below.
y_predict = lr.predict(X_test)

In [15]:
def TN(y_true, y_predict):
    """Count true negatives: positions labelled 0 that were also predicted 0.

    Args:
        y_true: 1-D sequence (list, tuple, ndarray, ...) of ground-truth
            binary labels, 0 or 1.
        y_predict: 1-D sequence of predicted binary labels, same length.

    Returns:
        NumPy integer count of positions where both labels equal 0.

    Raises:
        AssertionError: if the two inputs differ in length.
    """
    assert len(y_true) == len(y_predict)
    # Coerce to arrays so the comparisons are element-wise even for plain
    # lists/tuples; `[0, 1] == 0` on a bare list is just a single False.
    y_true = np.asarray(y_true)
    y_predict = np.asarray(y_predict)
    return np.sum((y_true == 0) & (y_predict == 0))

def FP(y_true, y_predict):
    """Count false positives: positions labelled 0 but predicted 1.

    Args:
        y_true: 1-D sequence (list, tuple, ndarray, ...) of ground-truth
            binary labels, 0 or 1.
        y_predict: 1-D sequence of predicted binary labels, same length.

    Returns:
        NumPy integer count of positions where the truth is 0 and the
        prediction is 1.

    Raises:
        AssertionError: if the two inputs differ in length.
    """
    assert len(y_true) == len(y_predict)
    # Coerce to arrays so the comparisons are element-wise even for plain
    # lists/tuples; `[0, 1] == 0` on a bare list is just a single False.
    y_true = np.asarray(y_true)
    y_predict = np.asarray(y_predict)
    return np.sum((y_true == 0) & (y_predict == 1))

def FN(y_true, y_predict):
    """Count false negatives: positions labelled 1 but predicted 0.

    Args:
        y_true: 1-D sequence (list, tuple, ndarray, ...) of ground-truth
            binary labels, 0 or 1.
        y_predict: 1-D sequence of predicted binary labels, same length.

    Returns:
        NumPy integer count of positions where the truth is 1 and the
        prediction is 0.

    Raises:
        AssertionError: if the two inputs differ in length.
    """
    assert len(y_true) == len(y_predict)
    # Coerce to arrays so the comparisons are element-wise even for plain
    # lists/tuples; `[0, 1] == 1` on a bare list is just a single False.
    y_true = np.asarray(y_true)
    y_predict = np.asarray(y_predict)
    return np.sum((y_true == 1) & (y_predict == 0))

def TP(y_true, y_predict):
    """Count true positives: positions labelled 1 that were also predicted 1.

    Args:
        y_true: 1-D sequence (list, tuple, ndarray, ...) of ground-truth
            binary labels, 0 or 1.
        y_predict: 1-D sequence of predicted binary labels, same length.

    Returns:
        NumPy integer count of positions where both labels equal 1.

    Raises:
        AssertionError: if the two inputs differ in length.
    """
    assert len(y_true) == len(y_predict)
    # Coerce to arrays so the comparisons are element-wise even for plain
    # lists/tuples; `[0, 1] == 1` on a bare list is just a single False.
    y_true = np.asarray(y_true)
    y_predict = np.asarray(y_predict)
    return np.sum((y_true == 1) & (y_predict == 1))

In [16]:
# Emit the four confusion-matrix counts, one per line, in the order
# TN, FP, FN, TP.
print(*(count(y_test, y_predict) for count in (TN, FP, FN, TP)), sep="\n")

403
2
9
36


In [20]:
def confusion_matrix(y_true, y_predict):
    """Assemble the 2x2 binary confusion matrix from the four count helpers.

    Rows follow the true label (0 first, then 1) and columns follow the
    predicted label (0 first, then 1), i.e. ``[[TN, FP], [FN, TP]]``.

    Args:
        y_true: ground-truth binary labels.
        y_predict: predicted binary labels, same length as ``y_true``.

    Returns:
        A 2x2 NumPy array of counts.
    """
    actual_negative_row = [TN(y_true, y_predict), FP(y_true, y_predict)]
    actual_positive_row = [FN(y_true, y_predict), TP(y_true, y_predict)]
    return np.array([actual_negative_row, actual_positive_row])

# Display the 2x2 matrix for the held-out predictions.
confusion_matrix(y_test, y_predict)

array([[403,   2],
       [  9,  36]])

In [21]:
def precision_score(y_true, y_predict):
    """Precision of the positive class: TP / (TP + FP).

    Args:
        y_true: ground-truth binary labels.
        y_predict: predicted binary labels, same length as ``y_true``.

    Returns:
        The fraction of predicted positives that are truly positive, or
        ``0.0`` when nothing was predicted positive (TP + FP == 0).
    """
    tp = TP(y_true, y_predict)
    fp = FP(y_true, y_predict)
    predicted_positive = tp + fp
    # With NumPy integers a zero denominator does not raise; it yields NaN
    # plus a RuntimeWarning. Report 0.0 for that undefined case instead.
    if predicted_positive == 0:
        return 0.0
    return tp / predicted_positive

# Display the precision of the held-out predictions.
precision_score(y_test, y_predict)

0.9473684210526315

In [22]:
def recall_score(y_true, y_predict):
    """Recall of the positive class: TP / (TP + FN).

    Args:
        y_true: ground-truth binary labels.
        y_predict: predicted binary labels, same length as ``y_true``.

    Returns:
        The fraction of truly positive samples that were predicted positive,
        or ``0.0`` when there are no positive samples (TP + FN == 0).
    """
    tp = TP(y_true, y_predict)
    fn = FN(y_true, y_predict)
    actual_positive = tp + fn
    # With NumPy integers a zero denominator does not raise; it yields NaN
    # plus a RuntimeWarning. Report 0.0 for that undefined case instead.
    if actual_positive == 0:
        return 0.0
    return tp / actual_positive

# Display the recall of the held-out predictions.
recall_score(y_test, y_predict)

0.8

### scikit-learn中的混淆矩阵，精准率和召回率

In [23]:
# NOTE: this import rebinds the name `confusion_matrix`, replacing the
# hand-written function of the same name defined earlier in this notebook.
from sklearn.metrics import confusion_matrix
# Same inputs as the hand-written version, for a side-by-side comparison.
confusion_matrix(y_test, y_predict)

array([[403,   2],
       [  9,  36]], dtype=int64)

In [24]:
# NOTE: this import rebinds the name `precision_score`, replacing the
# hand-written function of the same name defined earlier in this notebook.
from sklearn.metrics import precision_score

# Same inputs as the hand-written version, for a side-by-side comparison.
precision_score(y_test, y_predict)

0.9473684210526315

In [26]:
# NOTE: this import rebinds the name `recall_score`, replacing the
# hand-written function of the same name defined earlier in this notebook.
from sklearn.metrics import recall_score

# Same inputs as the hand-written version, for a side-by-side comparison.
recall_score(y_test, y_predict)

0.8