In [None]:
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split

# `load_boston` was deprecated in scikit-learn 1.0 and removed in 1.2, where the
# import raises ImportError. Fall back to a small shim that rebuilds the same
# arrays from the original data file so the cell still runs on a fresh kernel.
# NOTE(review): scikit-learn dropped this loader over ethical concerns with the
# dataset; consider switching datasets if this notebook is reused for new work.
try:
    from sklearn.datasets import load_boston
except ImportError:
    def load_boston():
        """Download the Boston housing data and return a Bunch with `data` and `target`.

        Requires network access. The parsing follows the recipe given in
        scikit-learn's deprecation notice for `load_boston`.
        """
        from urllib.request import urlopen

        import numpy as np
        from sklearn.utils import Bunch

        with urlopen("http://lib.stat.cmu.edu/datasets/boston") as response:
            lines = response.read().decode("utf-8", errors="replace").splitlines()
        # The first 22 lines are a textual description. Each record is then
        # wrapped over two lines (11 + 3 numbers), i.e. 14 numbers per record:
        # 13 feature columns followed by the target.
        values = np.array(" ".join(lines[22:]).split(), dtype=float).reshape(-1, 14)
        return Bunch(data=values[:, :13], target=values[:, 13])

boston = load_boston()
X, y = boston.data, boston.target

# Hold out 30% of the samples for evaluation; the fixed seed keeps the split
# reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=123)
lr = LinearRegression()
lr.fit(X_train, y_train)

# Predictions on the held-out set.
y_pred = lr.predict(X_test)

In [None]:
import matplotlib.pyplot as plt

# Scatter of predicted against actual targets (y_pred / y_test come from the
# preceding cell). Points on the dashed red diagonal are exact predictions.
fig, ax = plt.subplots()
ax.scatter(x=y_pred, y=y_test)
diagonal = [0, 50]
ax.plot(diagonal, diagonal, ls='--', c='red')
ax.set(xlabel='predicted value', ylabel='actual value')

plt.show()

In [None]:
import numpy as np

# Seed NumPy's global (legacy) generator so the synthetic sample is reproducible.
np.random.seed(223)

# X: 50 uniform draws from [0, 1). Y: the line 2*X plus uniform noise scaled
# by 0.5. The two draws are made in this order so the random stream is fixed.
X = np.random.rand(50)
noise = np.random.random(size=50)
Y = 2 * X + 0.5 * noise

fig, ax = plt.subplots()
ax.scatter(x=X, y=Y)

plt.show()

In [None]:
from sklearn.decomposition import PCA

# Stack the 1-D X and Y samples as two columns and project them onto their
# two principal components.
pca = PCA(n_components=2)
xy = np.column_stack((X, Y))
X_pca = pca.fit_transform(xy)

# Plot the first component against the second on fixed, symmetric axes.
fig, ax = plt.subplots()
pc1, pc2 = X_pca.T
ax.scatter(pc1, pc2)
ax.set(xlabel='PC1', ylabel='PC2', xlim=(-1.1, 1.1), ylim=(-1.1, 1.1))

plt.show()

In [None]:
from sklearn.datasets import load_iris 
from sklearn.svm import SVC

# Use only the first 100 iris rows (presumably the first two classes, giving a
# binary problem — verify against the dataset ordering).
iris = load_iris()
X = iris.data[:100]
y = iris.target[:100]

# Same 70/30 split settings as the regression example; seed fixed for
# reproducibility.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=123
)

# Fit a default-parameter support vector classifier and predict the held-out rows.
svc = SVC().fit(X_train, y_train)
y_pred = svc.predict(X_test)

In [None]:
from sklearn.metrics import classification_report

# Text summary of the classification metrics for the held-out predictions.
report = classification_report(y_true=y_test, y_pred=y_pred)
print(report)

In [None]:
from sklearn.model_selection import cross_val_score

# Start from a fresh, unfitted classifier and score it with 10-fold
# cross-validation on precision; the resulting array is the cell output.
svc = SVC()
cross_val_score(estimator=svc, X=X, y=y, scoring='precision', cv=10)

In [None]:
# Hand-built ROC points: running counts divided by their final totals
# (14 and 11) so that both axes run from 0 to 1.
fpr0 = np.array([0,0,0,1,1,2,3,3,3,3,4,5,5,6,7,8,8,8,9,10,10,11,12,12,13,14])/14
tpr0 = np.array([0,1,2,2,3,3,3,4,5,6,6,6,7,7,7,7,8,9,9,9,10,10,10,11,11,11])/11

fig, ax = plt.subplots()
ax.step(fpr0, tpr0)
ax.set_xlabel('false positive rate')
# Label corrected: the y-axis shows the true positive *rate* (tpr0), not a label.
ax.set_ylabel('true positive rate')
plt.show()

In [None]:
from sklearn.metrics import roc_curve

# Ground-truth binary labels, listed in the same order as the scores below.
labels = np.array([
    1, 1, 0, 1, 0,
    0, 1, 1, 1, 0,
    0, 1, 0, 0, 0,
    1, 1, 0, 0, 1,
    0, 0, 1, 0, 0,
])
# Predicted scores for each sample, in descending order.
probs = np.array([
    0.98, 0.95, 0.9, 0.87, 0.85,
    0.8, 0.75, 0.71, 0.63, 0.55,
    0.51, 0.47, 0.43, 0.38, 0.35,
    0.31, 0.28, 0.24, 0.22, 0.19,
    0.15, 0.12, 0.08, 0.04, 0.01,
])

# roc_curve returns the false positive rates, true positive rates and the
# thresholds at which they were evaluated.
fpr, tpr, threshold = roc_curve(labels, probs)
for caption, rates in (('False Positive Rate:', fpr), ('True Positive Rate:', tpr)):
    print(caption, rates)

In [None]:
# Step plot of the ROC curve computed by roc_curve in the previous cell.
fig, ax = plt.subplots()
ax.step(fpr, tpr)
ax.set_xlabel('false positive rate')
# Label corrected: the y-axis shows the true positive *rate* (tpr), not a label.
ax.set_ylabel('true positive rate')
plt.show()

In [None]:
from sklearn.metrics import roc_auc_score

# Compute the AUC (Area Under the Curve) for the labels and scores above;
# the value is shown as the cell output.
roc_auc_score(y_true=labels, y_score=probs)