# KNN Analysis Notebook

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import sys
import os

# Make the project's ../src directory importable so the `data_processing`
# package imported by later cells can be resolved.
# The relative path is resolved against the current working directory, so this
# assumes the kernel was started from the notebook's own folder.
SRC_DIR = os.path.abspath("../src")

# Guarded so that re-running this cell does not keep appending duplicate
# entries to sys.path.
if SRC_DIR not in sys.path:
    sys.path.append(SRC_DIR)


## 1. Data Preparation

### 1. Traffic Dataset

In [2]:
from data_processing.preprocess import load_traffic_data

# load_traffic_data() is unpacked into exactly six values. Judging by the
# names these are the train/test feature frames, the train/test labels, and
# the fitted label encoder and scaler -- confirm against preprocess.py.
(x_train_traffic, x_test_traffic,
 y_train_traffic, y_test_traffic,
 label_encoder_traffic, scaler_traffic) = load_traffic_data()

# Preview the training features as a sanity check on the preprocessing.
# NOTE(review): in the saved output every visible row has Month == 0.0 and
# Day == 0.0, the one-hot column names mix the prefixes "DayOfWeek_" and
# "Day of the week_", and some rows have more than one day-of-week flag set
# to True. Worth verifying the encoding step in the loader.
display(x_train_traffic)

Unnamed: 0,CarCount,BikeCount,BusCount,TruckCount,Total,Month,Day,DayOfWeek_Thursday,Day of the week_Friday,Day of the week_Monday,...,Time_14,Time_15,Time_16,Time_17,Time_18,Time_19,Time_20,Time_21,Time_22,Time_23
3758,-1.229900,-0.911105,-0.883897,0.409641,-1.280845,0.0,0.0,True,False,False,...,False,False,False,False,False,False,False,False,False,False
7970,-1.141506,-0.911105,-0.959224,1.503125,-1.021278,0.0,0.0,True,False,False,...,False,False,False,False,False,False,False,False,False,False
6995,-0.412252,-0.255889,-0.733242,-1.412832,-0.813624,0.0,0.0,True,True,False,...,False,False,False,False,False,False,True,False,False,False
7287,0.869466,-0.337791,-0.130621,1.229754,0.812998,0.0,0.0,True,False,True,...,False,False,False,False,False,False,False,True,False,False
2327,-0.301759,-0.419693,-0.733242,-0.228225,-0.536752,0.0,0.0,True,True,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1328,0.007621,0.808836,0.020034,-0.410472,0.103514,0.0,0.0,True,False,True,...,False,False,False,False,False,False,True,False,False,False
8768,1.510325,1.791659,1.827896,-1.321709,1.730136,0.0,0.0,True,False,False,...,False,False,False,False,False,False,False,False,False,False
228,1.709212,1.382149,1.752569,-1.503956,1.747441,0.0,0.0,True,False,False,...,False,False,False,False,False,False,False,False,False,False
8317,0.206508,0.645032,-0.582586,-1.503956,-0.121444,0.0,0.0,True,True,False,...,False,True,False,False,False,False,False,False,False,False


### 2. Congressional Voting Dataset

In [4]:
from data_processing.preprocess import load_congressional_voting_data

# load_congressional_voting_data() is unpacked into exactly six values.
# Judging by the names these are the train/test feature frames, the
# train/test labels, and the fitted label encoder and scaler -- confirm
# against preprocess.py.
(x_train_voting, x_test_voting,
 y_train_voting, y_test_voting,
 label_encoder_voting, scaler_voting) = load_congressional_voting_data()

# Preview the training features as a sanity check on the preprocessing.
display(x_train_voting)

Unnamed: 0,handicapped-infants,water-project-cost-sharing,adoption-of-the-budget-resolution,physician-fee-freeze,el-salvador-aid,religious-groups-in-schools,anti-satellite-test-ban,aid-to-nicaraguan-contras,mx-missile,immigration,synfuels-crporation-cutback,education-spending,superfund-right-to-sue,crime,duty-free-exports,export-administration-act-south-africa
202,-0.911770,0.818737,-1.204829,1.156919,1.0,0.72111,-1.188570,-1.273063,-0.948683,1.082326,1.366720,1.221394,0.887826,-1.204829,-0.864365,0.422249
73,-0.911770,-1.221394,-1.204829,1.156919,1.0,-1.38675,-1.188570,-1.273063,-0.948683,-0.923936,-0.731679,1.221394,-1.126347,0.829993,-0.864365,-2.368268
22,-0.911770,-1.221394,-1.204829,-0.864365,-1.0,-1.38675,0.841347,0.785507,1.054093,1.082326,-0.731679,1.221394,0.887826,0.829993,1.156919,0.422249
31,1.096767,0.818737,0.829993,-0.864365,-1.0,-1.38675,0.841347,0.785507,-0.948683,1.082326,-0.731679,-0.818737,-1.126347,-1.204829,-0.864365,0.422249
41,-0.911770,-1.221394,0.829993,-0.864365,-1.0,0.72111,0.841347,0.785507,1.054093,-0.923936,-0.731679,-0.818737,-1.126347,-1.204829,1.156919,0.422249
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
200,1.096767,0.818737,0.829993,-0.864365,-1.0,-1.38675,0.841347,0.785507,1.054093,-0.923936,1.366720,-0.818737,-1.126347,-1.204829,1.156919,0.422249
212,1.096767,0.818737,0.829993,-0.864365,-1.0,-1.38675,0.841347,0.785507,1.054093,-0.923936,1.366720,-0.818737,-1.126347,-1.204829,1.156919,0.422249
197,-0.911770,-1.221394,-1.204829,1.156919,1.0,0.72111,-1.188570,-1.273063,-0.948683,-0.923936,-0.731679,1.221394,0.887826,0.829993,-0.864365,-2.368268
122,-0.911770,-1.221394,-1.204829,1.156919,1.0,0.72111,0.841347,-1.273063,-0.948683,1.082326,-0.731679,1.221394,-1.126347,0.829993,1.156919,0.422249
