# Machine Learning Example

In [None]:
import pandas as pd

## Dataset: Graduate Admissions
### This dataset will be used to train a model that predicts whether a student will be "Admitted" into graduate school.

In [None]:
# Load the admissions data and drop "Serial No." (presumably just a row identifier,
# so it should not be offered to the model as a feature).
df = pd.read_csv("grad_admit.csv").drop(columns="Serial No.")

# Encode the target as integers (Yes -> 1, No -> 0). `.map` is used instead of
# `.replace` because replacing strings with ints relies on pandas silently
# downcasting the column afterwards, which is deprecated (FutureWarning in pandas 2.2).
admitted_codes = df["Admitted"].map({"Yes": 1, "No": 0})

# `.map` turns any label missing from the mapping into NaN; fail loudly here
# rather than hand a partially encoded target to the later cells.
if admitted_codes.isna().any():
    raise ValueError('Unexpected value in "Admitted"; expected only "Yes" or "No".')

df["Admitted"] = admitted_codes.astype("int64")

df.head()

In [None]:
# Check the size of the data: df.shape is a (number of rows, number of columns) tuple

df.shape

---

# Assuming the data has been prepared:

---

## Separate the data into X (features) and y (target)
#### Extract only the underlying values (NumPy arrays), not the DataFrame itself.

In [None]:
# Capital X holds all of the features that the algorithm will be given to learn from:
# every column except the target. Selecting by name rather than by position keeps
# the target out of X even if the column order of the file changes.
X = df.drop(columns="Admitted").to_numpy()

# Lowercase y is the target variable, the classifications that you would like to predict.
# `.to_numpy()` is the accessor pandas recommends over `.values`.
y = df["Admitted"].to_numpy()

In [None]:
# Preview the first 10 rows of the feature array X

X[:10]

---

---

## Split the data into train and test sets

In [None]:
from sklearn.model_selection import train_test_split

# Hold out 25% of the rows as a test set; the fixed random_state makes the
# shuffle (and therefore every downstream result) reproducible.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.25,
    random_state=1,
)

In [None]:
# Compare the shapes of the training and test feature arrays produced by the split
X_train.shape, X_test.shape

In [None]:
# Preview the first 10 rows of X_train (the training features, before standardization)

X_train[:10]

In [None]:
# Preview the first 10 entries of y_train (the training targets that pair with X_train)

y_train[:10]

---

## Standardize the data

In [None]:
# Standardize features using scikit-learn
from sklearn.preprocessing import StandardScaler

# Learn the scaling statistics from the training set only, so that nothing
# about the test set leaks into preprocessing.
stdsc = StandardScaler()
stdsc.fit(X_train)

# Apply the same training-derived scaling to both splits.
X_train_std = stdsc.transform(X_train)
X_test_std = stdsc.transform(X_test)

In [None]:
# Preview the first 5 rows of the standardized training features
X_train_std[:5]

---

# Machine Learning

## Logistic Regression

In [None]:
from sklearn.linear_model import LogisticRegression

# Build the classifier with scikit-learn's default settings and train it on the
# standardized training set. fit() returns the estimator itself, so the
# assignment keeps the trained model and the cell displays no output.
log_reg = LogisticRegression().fit(X_train_std, y_train)

### Evaluate the model's performance on the test set.
`score` compares the model's predictions for `X_test_std` to the `y_test` answer key and returns the mean accuracy (the fraction of correct predictions).

In [None]:
# For a classifier, score() reports mean accuracy: the fraction of test rows predicted correctly
log_reg.score(X_test_std, y_test)

---