In [10]:
import pandas as pd

## Importing the dataset

In [11]:
# Read the cross-analysis CSV and keep only the columns from position 3
# onward (the first three columns of the file are discarded).
dataset = pd.read_csv('Emotion_Sentences_Cross_Analysis.csv').iloc[:, 3:]

## Handling missing data

In [12]:
# Keep only the rows that have a value in the MPS column.
has_mps = dataset['MPS'].notna()
dataset = dataset.loc[has_mps]

In [13]:
# Predictors: the eight discrete-emotion columns, selected by name.
emotion_columns = ['Anger', 'Anticipation', 'Disgust', 'Fear',
                   'Joy', 'Sadness', 'Surprise', 'Trust']
X = dataset[emotion_columns]

# Response variables: the last four columns of `dataset`, selected by
# position and converted to NumPy arrays.
# NOTE(review): this assumes the trailing columns are ordered MPS, TRT, GD,
# FFD -- confirm against the CSV header, since positional selection silently
# picks the wrong column if the file layout changes.
y_MPS = dataset.iloc[:, -4].values
y_TRT = dataset.iloc[:, -3].values
y_GD = dataset.iloc[:, -2].values
y_FFD = dataset.iloc[:, -1].values

## Model building

In [14]:
import statsmodels.api as sm

### Discrete emotions - Mean Pupil Size

In [15]:
# Add a constant column to the predictors so the fit includes an intercept
# (the `const` row in the summary). The later model cells reuse this X.
X = sm.add_constant(X)

# Ordinary least squares fit of y_MPS on the predictors.
model_MPS = sm.OLS(endog=y_MPS, exog=X).fit()
model_MPS.summary()

0,1,2,3
Dep. Variable:,y,R-squared:,0.077
Model:,OLS,Adj. R-squared:,0.054
Method:,Least Squares,F-statistic:,3.273
Date:,"Sat, 07 Nov 2020",Prob (F-statistic):,0.00134
Time:,10:52:16,Log-Likelihood:,-1886.3
No. Observations:,322,AIC:,3791.0
Df Residuals:,313,BIC:,3825.0
Df Model:,8,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
const,3324.7863,7.002,474.837,0.000,3311.009,3338.563
Anger,-40.5889,35.698,-1.137,0.256,-110.827,29.649
Anticipation,-31.2026,17.404,-1.793,0.074,-65.446,3.041
Disgust,28.6897,37.393,0.767,0.444,-44.884,102.264
Fear,22.5137,25.865,0.870,0.385,-28.377,73.405
Joy,-21.1790,13.913,-1.522,0.129,-48.554,6.196
Sadness,41.8994,21.125,1.983,0.048,0.334,83.465
Surprise,-19.4050,39.442,-0.492,0.623,-97.010,58.200
Trust,-11.8619,8.657,-1.370,0.172,-28.895,5.171

0,1,2,3
Omnibus:,0.025,Durbin-Watson:,1.104
Prob(Omnibus):,0.988,Jarque-Bera (JB):,0.005
Skew:,0.008,Prob(JB):,0.997
Kurtosis:,2.988,Cond. No.,11.0


### Discrete emotions - Total Reading Time

In [16]:
# Ordinary least squares fit of y_TRT on the same predictor matrix X
# (X already carries the constant column added in the MPS cell).
model_TRT = sm.OLS(endog=y_TRT, exog=X).fit()
model_TRT.summary()

0,1,2,3
Dep. Variable:,y,R-squared:,0.213
Model:,OLS,Adj. R-squared:,0.192
Method:,Least Squares,F-statistic:,10.56
Date:,"Sat, 07 Nov 2020",Prob (F-statistic):,3.95e-13
Time:,10:52:16,Log-Likelihood:,-2688.5
No. Observations:,322,AIC:,5395.0
Df Residuals:,313,BIC:,5429.0
Df Model:,8,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
const,2304.3434,84.550,27.254,0.000,2137.985,2470.701
Anger,345.3330,431.059,0.801,0.424,-502.807,1193.473
Anticipation,806.0214,210.158,3.835,0.000,392.521,1219.522
Disgust,535.5215,451.532,1.186,0.237,-352.900,1423.943
Fear,-81.1226,312.324,-0.260,0.795,-695.642,533.397
Joy,261.7339,168.002,1.558,0.120,-68.821,592.289
Sadness,126.0973,255.090,0.494,0.621,-375.810,628.004
Surprise,-786.0567,476.269,-1.650,0.100,-1723.151,151.037
Trust,488.1826,104.535,4.670,0.000,282.503,693.862

0,1,2,3
Omnibus:,34.862,Durbin-Watson:,1.701
Prob(Omnibus):,0.0,Jarque-Bera (JB):,43.367
Skew:,0.82,Prob(JB):,3.83e-10
Kurtosis:,3.735,Cond. No.,11.0


### Discrete emotions - Gaze Duration

In [17]:
# Ordinary least squares fit of y_GD on the same predictor matrix X
# (X already carries the constant column added in the MPS cell).
model_GD = sm.OLS(endog=y_GD, exog=X).fit()
model_GD.summary()

0,1,2,3
Dep. Variable:,y,R-squared:,0.236
Model:,OLS,Adj. R-squared:,0.216
Method:,Least Squares,F-statistic:,12.06
Date:,"Sat, 07 Nov 2020",Prob (F-statistic):,5.1e-15
Time:,10:52:16,Log-Likelihood:,-2610.3
No. Observations:,322,AIC:,5239.0
Df Residuals:,313,BIC:,5273.0
Df Model:,8,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
const,1772.0161,66.327,26.716,0.000,1641.514,1902.519
Anger,255.9097,338.152,0.757,0.450,-409.429,921.249
Anticipation,705.0300,164.862,4.276,0.000,380.652,1029.408
Disgust,310.4347,354.212,0.876,0.381,-386.504,1007.373
Fear,-31.6931,245.008,-0.129,0.897,-513.764,450.378
Joy,219.8409,131.792,1.668,0.096,-39.469,479.151
Sadness,117.4154,200.110,0.587,0.558,-276.315,511.146
Surprise,-549.6001,373.618,-1.471,0.142,-1284.721,185.520
Trust,396.5896,82.004,4.836,0.000,235.241,557.939

0,1,2,3
Omnibus:,43.105,Durbin-Watson:,1.783
Prob(Omnibus):,0.0,Jarque-Bera (JB):,58.352
Skew:,0.911,Prob(JB):,2.13e-13
Kurtosis:,4.016,Cond. No.,11.0


### Discrete emotions - First Fixation Duration

In [18]:
# Ordinary least squares fit of y_FFD on the same predictor matrix X
# (X already carries the constant column added in the MPS cell).
model_FFD = sm.OLS(endog=y_FFD, exog=X).fit()
model_FFD.summary()

0,1,2,3
Dep. Variable:,y,R-squared:,0.248
Model:,OLS,Adj. R-squared:,0.228
Method:,Least Squares,F-statistic:,12.88
Date:,"Sat, 07 Nov 2020",Prob (F-statistic):,4.92e-16
Time:,10:52:16,Log-Likelihood:,-2576.7
No. Observations:,322,AIC:,5171.0
Df Residuals:,313,BIC:,5205.0
Df Model:,8,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
const,1596.3725,59.754,26.716,0.000,1478.802,1713.943
Anger,194.1624,304.644,0.637,0.524,-405.247,793.572
Anticipation,631.3579,148.526,4.251,0.000,339.123,923.593
Disgust,264.9308,319.113,0.830,0.407,-362.947,892.809
Fear,28.2378,220.730,0.128,0.898,-406.064,462.540
Joy,219.8622,118.732,1.852,0.065,-13.752,453.477
Sadness,129.3430,180.280,0.717,0.474,-225.372,484.058
Surprise,-539.8393,336.596,-1.604,0.110,-1202.116,122.437
Trust,374.5040,73.878,5.069,0.000,229.143,519.865

0,1,2,3
Omnibus:,43.094,Durbin-Watson:,1.794
Prob(Omnibus):,0.0,Jarque-Bera (JB):,58.737
Skew:,0.904,Prob(JB):,1.76e-13
Kurtosis:,4.053,Cond. No.,11.0
