# **Machine Learning Review**

- **Author** : starrykss
- **Date** : July 13, 2021

---

## **Linear Regression**

In [1]:
"""
Title : Linear Regression Practice with Boston Housing Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from tensorflow.keras import datasets
from sklearn.linear_model import LinearRegression

# Load Data
(train_data, train_label), (test_data, test_label) = datasets.boston_housing.load_data()

# Train
model_lr = LinearRegression()
model_lr.fit(train_data, train_label)

# Evaluation
prediction_lr = model_lr.predict(test_data)
error = sum(abs(prediction_lr - test_label)) / len(test_label)
print(error)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/boston_housing.npz
3.4641858124067206


## **Logistic Regression**

In [2]:
"""
Title : Logistic Regression Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_lr = LogisticRegression()
model_lr.fit(train_data, train_label)

# Evaluation
prediction_lr = model_lr.predict(test_data)
accuracy = sum(abs(prediction_lr == test_label)) / len(test_label)
print(accuracy)

0.9473684210526315


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


## **K-Nearest Neighbors**

In [3]:
"""
Title : K-Nearest Neighbors Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_knn = KNeighborsClassifier()
model_knn.fit(train_data, train_label)

# Evaluation
prediction_knn = model_knn.predict(test_data)
accuracy = sum(abs(prediction_knn == test_label)) / len(test_label)
print(accuracy)

0.9385964912280702


## **Support Vector Machine(SVM)**

In [6]:
"""
Title : Support Vector Machine Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
from sklearn.svm import SVC
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_svc = SVC(C=2)
model_svc.fit(train_data, train_label)

# Evaluation
prediction_svc = model_svc.predict(test_data)
accuracy = sum(abs(prediction_svc == test_label)) / len(test_label)
print(accuracy)

0.9122807017543859


## **Decision Tree**

In [4]:
"""
Title : Decision Tree Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
from sklearn.tree import DecisionTreeClassifier
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_tree = DecisionTreeClassifier()
model_tree.fit(train_data, train_label)

# Evaluation
prediction_tree = model_tree.predict(test_data)
accuracy = sum(abs(prediction_tree == test_label)) / len(test_label)
print(accuracy)

0.9473684210526315


## **Random Forest**

In [5]:
"""
Title : Random Forest Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_rf = LogisticRegression()
model_rf.fit(train_data, train_label)

# Evaluation
prediction_rf = model_rf.predict(test_data)
accuracy = sum(abs(prediction_rf == test_label)) / len(test_label)
print(accuracy)

0.9473684210526315


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


## **XGBoost**

In [8]:
"""
Title : XGBoost Practice with Breast Cancer Dataset
Date : July 13, 2021
Author : starrykss
"""

# Load Library(Package)
from sklearn.datasets import load_breast_cancer
import xgboost as xgb
from sklearn.model_selection import train_test_split

# Load Data
cancer = load_breast_cancer()
data = cancer['data']
target = cancer['target']
train_data, test_data, train_label, test_label = train_test_split(data, target, test_size=0.2, random_state=1)

# Train
model_xg = xgb.XGBClassifier()
model_xg.fit(train_data, train_label)

# Evaluation
prediction_xg = model_xg.predict(test_data)
accuracy = sum(abs(prediction_xg == test_label)) / len(test_label)
print(accuracy)

0.956140350877193
