# Importing Essential Packages

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline

from sklearn.pipeline import Pipeline
from sklearn.preprocessing import StandardScaler
from sklearn.decomposition import PCA
from sklearn.ensemble import RandomForestClassifier
from sklearn.svm import LinearSVC
from sklearn.model_selection import cross_val_score, train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.neural_network import MLPClassifier

import xgboost as xgb

import warnings
import os

# Loading Data and Basic Exploration

In [2]:
# Load the dataset from the CSV file in the working directory into a DataFrame.
brainwave_df = pd.read_csv(filepath_or_buffer='emotions.csv')

In [3]:
# Preview the first five rows as a quick sanity check of the loaded data.
brainwave_df.head(n=5)

Unnamed: 0,# mean_0_a,mean_1_a,mean_2_a,mean_3_a,mean_4_a,mean_d_0_a,mean_d_1_a,mean_d_2_a,mean_d_3_a,mean_d_4_a,...,fft_741_b,fft_742_b,fft_743_b,fft_744_b,fft_745_b,fft_746_b,fft_747_b,fft_748_b,fft_749_b,label
0,4.62,30.3,-356.0,15.6,26.3,1.07,0.411,-15.7,2.06,3.15,...,23.5,20.3,20.3,23.5,-215.0,280.0,-162.0,-162.0,280.0,NEGATIVE
1,28.8,33.1,32.0,25.8,22.8,6.55,1.68,2.88,3.83,-4.82,...,-23.3,-21.8,-21.8,-23.3,182.0,2.57,-31.6,-31.6,2.57,NEUTRAL
2,8.9,29.4,-416.0,16.7,23.7,79.9,3.36,90.2,89.9,2.03,...,462.0,-233.0,-233.0,462.0,-267.0,281.0,-148.0,-148.0,281.0,POSITIVE
3,14.9,31.6,-143.0,19.8,24.3,-0.584,-0.284,8.82,2.3,-1.97,...,299.0,-243.0,-243.0,299.0,132.0,-12.4,9.53,9.53,-12.4,POSITIVE
4,28.3,31.3,45.2,27.3,24.5,34.8,-5.79,3.06,41.4,5.52,...,12.0,38.1,38.1,12.0,119.0,-17.6,23.9,23.9,-17.6,NEUTRAL


In [4]:
# Shape of the DataFrame as a (rows, columns) tuple

brainwave_df.shape

(2132, 2549)

In [5]:
# Concise DataFrame summary: index range, column count, dtype counts and memory usage

brainwave_df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2132 entries, 0 to 2131
Columns: 2549 entries, # mean_0_a to label
dtypes: float64(2548), object(1)
memory usage: 41.5+ MB


In [6]:
# Data type of each column (the listing is truncated in the middle for wide frames)

brainwave_df.dtypes

# mean_0_a    float64
mean_1_a      float64
mean_2_a      float64
mean_3_a      float64
mean_4_a      float64
               ...   
fft_746_b     float64
fft_747_b     float64
fft_748_b     float64
fft_749_b     float64
label          object
Length: 2549, dtype: object

In [8]:
# Descriptive statistics (count, mean, std, min, quartiles, max) for the numeric columns;
# the non-numeric `label` column does not appear in the output

brainwave_df.describe()

Unnamed: 0,# mean_0_a,mean_1_a,mean_2_a,mean_3_a,mean_4_a,mean_d_0_a,mean_d_1_a,mean_d_2_a,mean_d_3_a,mean_d_4_a,...,fft_740_b,fft_741_b,fft_742_b,fft_743_b,fft_744_b,fft_745_b,fft_746_b,fft_747_b,fft_748_b,fft_749_b
count,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,...,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0,2132.0
mean,15.256914,27.012462,-104.975629,13.605898,24.150483,0.025378,0.052282,0.301655,0.036793,0.083567,...,-22.938971,104.946111,-51.973647,-51.973647,104.946111,-6.934144,95.104886,-49.061255,-49.061255,95.104886
std,15.284621,9.265141,206.27196,16.874676,14.18734,17.981796,8.509174,68.098894,17.010031,18.935378,...,298.034311,212.532721,112.160233,112.160233,212.532721,281.040552,203.194976,106.486317,106.486317,203.194976
min,-61.3,-114.0,-970.0,-137.0,-217.0,-218.0,-255.0,-1360.0,-203.0,-553.0,...,-1180.0,-921.0,-504.0,-504.0,-921.0,-1160.0,-1010.0,-521.0,-521.0,-1010.0
25%,6.5775,26.075,-195.0,4.8575,23.6,-3.105,-1.34,-4.0025,-2.905,-2.6225,...,-106.5,-8.365,-92.9,-92.9,-8.365,-102.5,-8.8375,-87.15,-87.15,-8.8375
50%,14.1,30.0,14.95,15.4,25.2,-0.0446,0.132,0.9575,-0.09975,0.1465,...,83.85,12.15,-21.8,-21.8,12.15,89.7,13.4,-24.1,-24.1,13.4
75%,27.7,31.4,29.6,26.5,26.8,2.92,1.54,6.735,2.535,2.87,...,154.0,177.0,12.025,12.025,177.0,153.0,149.25,10.925,10.925,149.25
max,304.0,42.3,661.0,206.0,213.0,402.0,257.0,1150.0,349.0,444.0,...,1070.0,843.0,1490.0,1490.0,843.0,1180.0,888.0,1670.0,1670.0,888.0
