In [1]:
from typing import Optional, List, Dict, Union

import numpy as np
import pandas as pd

from IPython.display import display, HTML

from matplotlib import pyplot as plt

from tqdm.notebook import tqdm_notebook as tqdm

from notebook_utils.constants import PROJ_ROOT, NEW_GENRES, GENRE_COMBS, scale
from notebook_utils.predictions import Predictor
from notebook_utils.utils import display_df, setup_axis, process_and_scale, create_cmap

# Enable IPython's autoreload extension in mode 2 so edits to imported
# project modules (e.g. notebook_utils) are picked up without a kernel restart.
%load_ext autoreload
%autoreload 2

# Register tqdm's progress-bar integration with pandas.
tqdm.pandas()

# Shared predictor used by every cell below; feature tables are read through
# `p.loader` and models are trained with `p.predict_success`.
# NOTE(review): only "unigram" is listed in `models`, yet later cells use the
# bigram, POS, production-rule, Roget, WordNet, LIWC and NRC frames — confirm
# what `models` actually restricts.
# NOTE(review): `first_1k=True` presumably limits each book to its first 1k
# tokens (the previews show a `first_1k` text column) — confirm.
p = Predictor(models=["unigram"], first_1k=True)

  from pandas import Panel


# Show Loaded Data

In [2]:
# Preview the loader's "Unigram" table: per the recorded output, one row per
# book with its genre, the raw `first_1k` text, and the @Outcome label.
p.loader.show_model_df("Unigram")

Book #,@Genre,first_1k,@Outcome
10368,Adventure_Stories,i was on a french steamer bound from havre to new york when i had a peculiar experience in the way o...,FAILURE
12190,Adventure_Stories,an introductory disaster early in the spring of the year 1884 the threemasted schooner castor from s...,FAILURE
13290,Adventure_Stories,editors note martin rattler was one of robert michael ballantynes early booksborn at edinburgh in 18...,FAILURE
...,...,...,...
29948,Short_Stories,experiment the first time machine gentlemen professor johnson proudly informed his two colleaguestru...,SUCCESSFUL
3815,Short_Stories,o henry afritechef of all delight of all delectables conglomerate that stay the starved brain and re...,SUCCESSFUL
8129,Short_Stories,preface poltarnees beholder of ocean blagdaross the madness of andelsprutz where the tides ebb and f...,SUCCESSFUL


In [3]:
# Preview the loader's "Bigram" table.
# NOTE(review): the recorded output is the same raw `first_1k` text table as
# the Unigram preview — presumably n-gram extraction happens later, inside the
# predictor; confirm.
p.loader.show_model_df("Bigram")

Book #,@Genre,first_1k,@Outcome
10368,Adventure_Stories,i was on a french steamer bound from havre to new york when i had a peculiar experience in the way o...,FAILURE
12190,Adventure_Stories,an introductory disaster early in the spring of the year 1884 the threemasted schooner castor from s...,FAILURE
13290,Adventure_Stories,editors note martin rattler was one of robert michael ballantynes early booksborn at edinburgh in 18...,FAILURE
...,...,...,...
29948,Short_Stories,experiment the first time machine gentlemen professor johnson proudly informed his two colleaguestru...,SUCCESSFUL
3815,Short_Stories,o henry afritechef of all delight of all delectables conglomerate that stay the starved brain and re...,SUCCESSFUL
8129,Short_Stories,preface poltarnees beholder of ocean blagdaross the madness of andelsprutz where the tides ebb and f...,SUCCESSFUL


In [4]:
# Preview the loader's "POS" table: one numeric column per part-of-speech tag
# (VBD, IN, DT, ...) alongside @Genre and @Outcome.
p.loader.show_model_df("POS")

Book #,@Genre,VBD,IN,DT,...,ROOT,LS,ADD,META,@Outcome
10368,Adventure_Stories,0.341839,0.288571,0.292251,...,0.0,0.000000,0.0,0.0,FAILURE
12190,Adventure_Stories,0.331481,0.293392,0.415268,...,0.0,0.000000,0.0,0.0,FAILURE
13290,Adventure_Stories,0.314553,0.354935,0.473672,...,0.0,0.000000,0.0,0.0,FAILURE
15072,Adventure_Stories,0.208186,0.174560,0.221430,...,0.0,0.000000,0.0,0.0,FAILURE
18399,Adventure_Stories,0.198080,0.279921,0.379168,...,0.0,0.000000,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.084386,0.076858,0.114739,...,0.0,0.093333,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.208944,0.262904,0.394573,...,0.0,0.013333,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.006316,0.002411,0.000000,...,0.0,0.000000,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.148560,0.206183,0.293401,...,0.0,0.000000,0.0,0.0,SUCCESSFUL


In [5]:
# Preview the loader's "Lex" table: lexicalized production-rule columns
# such as "PRP -> i", alongside @Genre and @Outcome.
p.loader.show_model_df("Lex")

Book #,@Genre,PRP -> i,DT -> a,JJ -> french,...,VB -> arleon,NN -> estabonn,VBP -> accrue,NN -> unforetold,@Outcome
10368,Adventure_Stories,0.830110,0.601103,0.138889,...,0.0,0.0,0.0,0.0,FAILURE
12190,Adventure_Stories,0.151934,0.610294,0.027778,...,0.0,0.0,0.0,0.0,FAILURE
13290,Adventure_Stories,0.194751,0.799632,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
15072,Adventure_Stories,0.321823,0.566176,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
18399,Adventure_Stories,0.256906,0.490809,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.040055,0.148897,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.168508,0.667279,0.138889,...,0.0,0.0,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.008287,0.000000,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.381215,0.573529,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL


In [6]:
# Preview the loader's "LexG" table: lexicalized production rules prefixed
# with the grandparent node, e.g. "ROOT -> PRP -> i".
p.loader.show_model_df("LexG")

Book #,@Genre,ROOT -> PRP -> i,PP -> DT -> a,PP -> JJ -> french,...,NP -> NNS -> bouts,ROOT -> RB -> guardedly,ROOT -> NN -> unforetold,S -> VBP -> foretell,@Outcome
10368,Adventure_Stories,0.579832,0.348214,0.333333,...,0.0,0.0,0.0,0.0,FAILURE
12190,Adventure_Stories,0.155462,0.392857,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
13290,Adventure_Stories,0.142857,0.714286,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
15072,Adventure_Stories,0.201681,0.339286,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
18399,Adventure_Stories,0.243697,0.383929,0.000000,...,0.0,0.0,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.063025,0.080357,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.197479,0.607143,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.008403,0.026786,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.462185,0.357143,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL


In [7]:
# Preview the loader's "Nonlex" table: nonlexicalized production-rule columns
# such as "NP -> PRP". Some rule names are very long (whole-sentence
# expansions), which makes the rendered header wide.
p.loader.show_model_df("Nonlex")

Book #,@Genre,NP -> PRP,NP -> DT JJ NN,NP -> NN,...,SQ -> PP VBZ NP ADVP VP,"S -> ADJP , SBAR : SINV .","X -> CC WRB DT NN VBD VBN CC DT NNS VBD RB , DT NN VBD RP IN PRP$ NN , CC VBG JJ NN , CC VBG IN DT NN IN PRP$ NN CC IN PDT PRP$ NNS IN PRP , VBN IN DT NN , VBG , '' VBD . '' CC DT NN VBD RB , VBG PRP$ JJ NN , CC VBD RB : `` EX VBP JJ NNS , '' PRP VBD , `` IN DT NNS IN NN WDT VBP VBN RB IN DT NN POS NNS , CC JJ JJR VBP JJ IN PRP WDT VBD JJR VBN IN DT : RB PRP VBP DT VBZ JJR NN , CC DT NNS WDT PRP MD RB VB IN NN IN NNS IN NN .",S -> CC S : SBAR . '' ADVP S : S .,@Outcome
10368,Adventure_Stories,0.996599,0.551570,0.632750,...,0.0,0.0,0.0,0.0,FAILURE
12190,Adventure_Stories,0.887755,0.612108,0.675676,...,0.0,0.0,0.0,0.0,FAILURE
13290,Adventure_Stories,0.793651,0.654709,0.828299,...,0.0,0.0,0.0,0.0,FAILURE
15072,Adventure_Stories,0.890023,0.336323,0.809221,...,0.0,0.0,0.0,0.0,FAILURE
18399,Adventure_Stories,0.780045,0.576233,0.597774,...,0.0,0.0,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.244898,0.183857,0.227345,...,0.0,0.0,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.675737,0.582960,0.615262,...,0.0,0.0,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.018141,0.000000,0.000000,...,0.0,0.0,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.798186,0.421525,0.511924,...,0.0,0.0,0.0,0.0,SUCCESSFUL


In [8]:
# Preview the loader's "NonlexG" table: nonlexicalized production rules
# prefixed with the grandparent node, e.g. "ROOT -> NP -> PRP".
p.loader.show_model_df("NonlexG")

Book #,@Genre,ROOT -> NP -> PRP,PP -> NP -> DT JJ NN,PP -> NP -> NN,...,VP -> SQ -> PP VBZ NP ADVP VP,"ROOT -> S -> ADJP , SBAR : SINV .","ROOT -> X -> CC WRB DT NN VBD VBN CC DT NNS VBD RB , DT NN VBD RP IN PRP$ NN , CC VBG JJ NN , CC VBG IN DT NN IN PRP$ NN CC IN PDT PRP$ NNS IN PRP , VBN IN DT NN , VBG , '' VBD . '' CC DT NN VBD RB , VBG PRP$ JJ NN , CC VBD RB : `` EX VBP JJ NNS , '' PRP VBD , `` IN DT NNS IN NN WDT VBP VBN RB IN DT NN POS NNS , CC JJ JJR VBP JJ IN PRP WDT VBD JJR VBN IN DT : RB PRP VBP DT VBZ JJR NN , CC DT NNS WDT PRP MD RB VB IN NN IN NNS IN NN .",ROOT -> S -> CC S : SBAR . '' ADVP S : S .,@Outcome
10368,Adventure_Stories,0.629371,0.435644,0.47,...,0.0,0.0,0.0,0.0,FAILURE
12190,Adventure_Stories,0.585082,0.554455,0.42,...,0.0,0.0,0.0,0.0,FAILURE
13290,Adventure_Stories,0.396270,0.485149,0.34,...,0.0,0.0,0.0,0.0,FAILURE
15072,Adventure_Stories,0.421911,0.178218,0.31,...,0.0,0.0,0.0,0.0,FAILURE
18399,Adventure_Stories,0.459207,0.366337,0.28,...,0.0,0.0,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.179487,0.158416,0.15,...,0.0,0.0,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.540793,0.534653,0.41,...,0.0,0.0,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.032634,0.009901,0.00,...,0.0,0.0,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.650350,0.277228,0.27,...,0.0,0.0,0.0,0.0,SUCCESSFUL


In [9]:
# Preview the loader's "Phrasal" table: one numeric column per phrase-level
# tag (NP, VP, PP, ...) alongside @Genre and @Outcome.
p.loader.show_model_df("Phrasal")

Book #,@Genre,NP,VP,PP,...,LST,WHADJP,X,RRC,@Outcome
10368,Adventure_Stories,0.729850,0.830390,0.552301,...,0.006757,0.102564,0.166667,0.000000,FAILURE
12190,Adventure_Stories,0.685774,0.810549,0.558229,...,0.000000,0.051282,0.000000,0.142857,FAILURE
13290,Adventure_Stories,0.738393,0.684975,0.609833,...,0.000000,0.076923,0.166667,0.071429,FAILURE
15072,Adventure_Stories,0.539681,0.625212,0.349024,...,0.006757,0.102564,0.333333,0.000000,FAILURE
18399,Adventure_Stories,0.608518,0.676990,0.541492,...,0.013514,0.128205,0.000000,0.071429,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.201808,0.207597,0.161437,...,0.054054,0.000000,0.166667,0.071429,SUCCESSFUL
2777,Short_Stories,0.649870,0.538108,0.576360,...,0.006757,0.076923,0.000000,0.142857,SUCCESSFUL
29948,Short_Stories,0.005076,0.006049,0.004184,...,0.000000,0.000000,0.000000,0.000000,SUCCESSFUL
3815,Short_Stories,0.567166,0.497459,0.429568,...,0.013514,0.025641,0.166667,0.071429,SUCCESSFUL


In [10]:
# Preview the loader's "Roget" table: columns are named categories such as
# "vehicle" and "ship" (presumably Roget's Thesaurus categories — confirm).
p.loader.show_model_df("Roget")

Book #,@Genre,vehicle,ship,circumscription,...,numbness,analogy,zoology,inodorousness,@Outcome
10368,Adventure_Stories,0.273418,0.084699,0.391304,...,0.0,0.000000,0.0,0.0,FAILURE
12190,Adventure_Stories,0.508861,0.185792,0.086957,...,0.0,0.000000,0.0,0.0,FAILURE
13290,Adventure_Stories,0.526582,0.275956,0.173913,...,0.0,0.000000,0.0,0.0,FAILURE
15072,Adventure_Stories,0.453165,0.043716,0.000000,...,0.0,0.000000,0.0,0.0,FAILURE
18399,Adventure_Stories,0.308861,0.278689,0.086957,...,0.0,0.000000,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.101266,0.084699,0.043478,...,0.0,0.000000,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.400000,0.224044,0.260870,...,0.0,0.034483,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.025316,0.000000,0.000000,...,0.0,0.000000,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.367089,0.054645,0.217391,...,0.0,0.000000,0.0,0.0,SUCCESSFUL


In [11]:
# Preview the loader's "WordNet" table: columns are word-like feature names
# such as "be", "exist" and "equal", alongside @Genre and @Outcome.
p.loader.show_model_df("WordNet")

Book #,@Genre,be,exist,equal,...,bromo-seltzer,sheeting,unrepaired,tax-exempt,@Outcome
10368,Adventure_Stories,0.397547,0.416203,0.394758,...,0.0,0.0,0.0,0.0,FAILURE
12190,Adventure_Stories,0.368411,0.367752,0.364972,...,0.0,0.0,0.0,0.0,FAILURE
13290,Adventure_Stories,0.326959,0.328435,0.325655,...,0.0,0.0,0.0,0.0,FAILURE
15072,Adventure_Stories,0.230889,0.229944,0.228356,...,0.0,0.0,0.0,0.0,FAILURE
18399,Adventure_Stories,0.271940,0.271644,0.270453,...,0.0,0.0,0.0,0.0,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.120100,0.126688,0.119539,...,0.0,0.0,0.0,0.0,SUCCESSFUL
2777,Short_Stories,0.222829,0.224782,0.222002,...,0.0,0.0,0.0,0.0,SUCCESSFUL
29948,Short_Stories,0.004856,0.005163,0.004766,...,0.0,0.0,0.0,0.0,SUCCESSFUL
3815,Short_Stories,0.180926,0.183082,0.178713,...,1.0,1.0,0.0,0.0,SUCCESSFUL


In [12]:
# Preview the loader's "LIWC" table: columns are category names such as
# "future", "i", "past", "relig" and "death".
p.loader.show_model_df("LIWC")

Book #,@Genre,future,i,past,...,relig,family,money,death,@Outcome
10368,Adventure_Stories,0.379189,0.407635,0.490017,...,0.153716,0.287879,0.256356,0.129310,FAILURE
12190,Adventure_Stories,0.307872,0.048424,0.368379,...,0.104730,0.050505,0.063559,0.088362,FAILURE
13290,Adventure_Stories,0.273188,0.079939,0.293595,...,0.138514,0.103535,0.239407,0.127155,FAILURE
15072,Adventure_Stories,0.274097,0.093262,0.301904,...,0.067568,0.333333,0.129237,0.023707,FAILURE
18399,Adventure_Stories,0.261756,0.106585,0.270167,...,0.432432,0.449495,0.266949,0.157328,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.066641,0.014348,0.083785,...,0.016892,0.002525,0.031780,0.038793,SUCCESSFUL
2777,Short_Stories,0.188101,0.050730,0.217888,...,0.065878,0.042929,0.256356,0.062500,SUCCESSFUL
29948,Short_Stories,0.005456,0.002306,0.005540,...,0.001689,0.000000,0.000000,0.004310,SUCCESSFUL
3815,Short_Stories,0.190699,0.130925,0.209925,...,0.060811,0.118687,0.273305,0.073276,SUCCESSFUL


In [13]:
# Preview the loader's "NRC" table: emotion/sentiment columns such as
# "anger", "anticipation", "positive" and "trust".
p.loader.show_model_df("NRC")

Book #,@Genre,anger,anticipation,disgust,...,positive,sadness,surprise,trust,@Outcome
10368,Adventure_Stories,0.167778,0.161198,0.158824,...,0.260686,0.247542,0.405537,0.310249,FAILURE
12190,Adventure_Stories,0.262222,0.117261,0.248529,...,0.233245,0.294906,0.366450,0.195014,FAILURE
13290,Adventure_Stories,0.485556,0.174037,0.442647,...,0.347757,0.447721,0.589577,0.459280,FAILURE
15072,Adventure_Stories,0.144444,0.123252,0.147059,...,0.218734,0.174263,0.302932,0.232133,FAILURE
18399,Adventure_Stories,0.350000,0.159486,0.377941,...,0.287335,0.291332,0.407166,0.393906,FAILURE
...,...,...,...,...,...,...,...,...,...,...
27462,Short_Stories,0.155556,0.032525,0.107353,...,0.068074,0.127793,0.087948,0.099169,SUCCESSFUL
2777,Short_Stories,0.218889,0.114408,0.192647,...,0.245646,0.234138,0.353420,0.322992,SUCCESSFUL
29948,Short_Stories,0.004444,0.000000,0.011765,...,0.000000,0.002681,0.000000,0.006648,SUCCESSFUL
3815,Short_Stories,0.310000,0.083595,0.263235,...,0.166491,0.180518,0.263844,0.226039,SUCCESSFUL


# Train Models

In [14]:
# Shared list handed to `p.predict_success(..., add_to_acc=...)` by the model
# cells below, so their results can be gathered in one place.
# NOTE(review): if `predict_success` appends to this list, re-running a model
# cell without re-running this one would presumably record it twice — confirm.
no_reduc_accs = []

### Unigram

In [15]:
# Run success prediction on the unigram table and keep both the accuracy
# result and the feature weights; weights are not displayed here.
unigram_acc, uni_weights = p.predict_success(
    p.loader.unigram_df,
    "Unigram",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
Unigram,Adventure_Stories,0.77
Unigram,Fiction,0.66
Unigram,Historical_Fiction,0.56
Unigram,Love_Stories,0.67
Unigram,Mystery,0.77
Unigram,Poetry,0.74
Unigram,Science_Fiction,0.68
Unigram,Short_Stories,0.63
Unigram,Average,0.685


### Bigram

In [16]:
# Run success prediction on the bigram table and keep both the accuracy
# result and the feature weights; weights are not displayed here.
bigram_acc, bigram_weights = p.predict_success(
    p.loader.bigram_df,
    "Bigram",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
Bigram,Adventure_Stories,0.7
Bigram,Fiction,0.78
Bigram,Historical_Fiction,0.6
Bigram,Love_Stories,0.73
Bigram,Mystery,0.75
Bigram,Poetry,0.81
Bigram,Science_Fiction,0.54
Bigram,Short_Stories,0.62
Bigram,Average,0.69125


### POS

In [17]:
# Run success prediction on the scaled POS-tag table and keep both the
# accuracy result and the feature weights; weights are not displayed here.
pos_acc, pos_weights = p.predict_success(
    p.loader.pos_df_scaled,
    "POS",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
POS,Adventure_Stories,0.66
POS,Fiction,0.74
POS,Historical_Fiction,0.58
POS,Love_Stories,0.69
POS,Mystery,0.5
POS,Poetry,0.77
POS,Science_Fiction,0.57
POS,Short_Stories,0.61
POS,Average,0.64


### Phrasal

In [18]:
# Run success prediction on the scaled phrasal-tag table and display the
# learned feature weights (disp_weights=True).
# `add_to_acc=no_reduc_accs` is passed so the Phrasal results are collected in
# the same shared list as every other model in this section; without it this
# model would be the only one missing from that list.
phrasal_acc, phrasal_weights = p.predict_success(
    p.loader.phrasal_df_scaled,
    "Phrasal",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=True,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Feature,Weight
WHNP,1.032079
PP,0.573842
LST,0.544289
PRN,0.425144
UCP,0.422968
...,...
ADVP,-0.269928
WHPP,-0.336511
INTJ,-0.582772
PRT,-0.603378


Feature,Weight
PRT,1.230477
UCP,1.136040
WHNP,0.711995
PP,0.699109
QP,0.602911
...,...
ADVP,-0.322746
INTJ,-0.757073
ADJP,-0.786532
VP,-0.932505


Feature,Weight
CONJP,1.228494
WHNP,0.781362
PRN,0.595609
QP,0.550994
ADJP,0.316093
...,...
UCP,-0.314597
ADVP,-0.316990
NAC,-0.320590
VP,-0.541547


Feature,Weight
PP,1.739874
UCP,0.919448
CONJP,0.470607
WHPP,0.455710
X,0.422446
...,...
PRT,-0.350095
PRN,-0.455243
ADJP,-0.716273
VP,-0.770386


Feature,Weight
FRAG,1.291390
WHNP,1.264176
PRN,1.092232
NAC,0.533967
UCP,0.399262
...,...
X,-0.303254
INTJ,-0.309768
WHADJP,-0.407474
ADVP,-0.865071


Feature,Weight
WHADJP,1.054678
X,1.026432
CONJP,0.819705
PRT,0.643192
VP,0.546769
...,...
NP,-0.081172
NAC,-0.239500
WHNP,-0.432172
ADJP,-1.047455


Feature,Weight
PRT,1.240449
X,1.011311
PP,0.452391
NAC,0.395237
NP,0.268281
...,...
INTJ,-0.120369
ADJP,-0.130167
WHADJP,-0.251468
VP,-0.268541


Feature,Weight
PRT,0.947065
UCP,0.578130
CONJP,0.561600
PP,0.516226
NP,0.363105
...,...
PRN,-0.043398
WHNP,-0.133215
NAC,-0.594689
ADJP,-0.604593


Genre,Accuracy
Adventure_Stories,0.72
Fiction,0.63
Historical_Fiction,0.5
Love_Stories,0.7
Mystery,0.59
Poetry,0.59
Science_Fiction,0.59
Short_Stories,0.54
Average,0.6075


### $\Gamma$ (lexicalized production rules)

In [19]:
# Run success prediction on the scaled lexicalized production-rule table.
# The model label is a raw string: in a normal string literal "\G" is an
# invalid escape sequence (a warning today, an error in future Python
# versions). The resulting label text is unchanged.
lex_acc, lex_weights = p.predict_success(
    p.loader.lex_df_scaled,
    r"$\Gamma$",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
$\Gamma$,Adventure_Stories,0.62
$\Gamma$,Fiction,0.69
$\Gamma$,Historical_Fiction,0.53
$\Gamma$,Love_Stories,0.74
$\Gamma$,Mystery,0.78
$\Gamma$,Poetry,0.8
$\Gamma$,Science_Fiction,0.57
$\Gamma$,Short_Stories,0.68
$\Gamma$,Average,0.67625


### $\Gamma^G$ (lexicalized production rules, prepended with grandparent node)

In [20]:
# Run success prediction on the scaled lexicalized production-rule table with
# grandparent prefixes.
# The model label is a raw string: in a normal string literal "\G" is an
# invalid escape sequence (a warning today, an error in future Python
# versions). The resulting label text is unchanged.
lexg_acc, lexg_weights = p.predict_success(
    p.loader.lexg_df_scaled,
    r"$\Gamma^G$",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
$\Gamma^G$,Adventure_Stories,0.64
$\Gamma^G$,Fiction,0.66
$\Gamma^G$,Historical_Fiction,0.56
$\Gamma^G$,Love_Stories,0.67
$\Gamma^G$,Mystery,0.78
$\Gamma^G$,Poetry,0.77
$\Gamma^G$,Science_Fiction,0.6
$\Gamma^G$,Short_Stories,0.68
$\Gamma^G$,Average,0.67


### $\gamma$ (nonlexicalized production rules)

In [21]:
# Run success prediction on the scaled nonlexicalized production-rule table.
# The model label is a raw string: in a normal string literal "\g" is an
# invalid escape sequence (a warning today, an error in future Python
# versions). The resulting label text is unchanged.
nonlex_acc, nonlex_weights = p.predict_success(
    p.loader.nonlex_df_scaled,
    r"$\gamma$",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
$\gamma$,Adventure_Stories,0.67
$\gamma$,Fiction,0.68
$\gamma$,Historical_Fiction,0.5
$\gamma$,Love_Stories,0.69
$\gamma$,Mystery,0.6
$\gamma$,Poetry,0.62
$\gamma$,Science_Fiction,0.57
$\gamma$,Short_Stories,0.57
$\gamma$,Average,0.6125


### $\gamma^G$ (nonlexicalized production rules, prepended with grandparent node)

In [22]:
# Run success prediction on the scaled nonlexicalized production-rule table
# with grandparent prefixes.
# The model label is a raw string: in a normal string literal "\g" is an
# invalid escape sequence (a warning today, an error in future Python
# versions). The resulting label text is unchanged.
nonlexg_acc, nonlexg_weights = p.predict_success(
    p.loader.nonlexg_df_scaled,
    r"$\gamma^G$",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
$\gamma^G$,Adventure_Stories,0.68
$\gamma^G$,Fiction,0.72
$\gamma^G$,Historical_Fiction,0.56
$\gamma^G$,Love_Stories,0.62
$\gamma^G$,Mystery,0.63
$\gamma^G$,Poetry,0.69
$\gamma^G$,Science_Fiction,0.55
$\gamma^G$,Short_Stories,0.58
$\gamma^G$,Average,0.62875


### Roget

In [23]:
# Run success prediction on the scaled Roget table and keep both the
# accuracy result and the feature weights; weights are not displayed here.
roget_acc, roget_weights = p.predict_success(
    p.loader.roget_df_scaled,
    "Roget",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
Roget,Adventure_Stories,0.71
Roget,Fiction,0.71
Roget,Historical_Fiction,0.54
Roget,Love_Stories,0.62
Roget,Mystery,0.68
Roget,Poetry,0.76
Roget,Science_Fiction,0.67
Roget,Short_Stories,0.65
Roget,Average,0.6675


### WordNet

In [24]:
# Run success prediction on the scaled WordNet table and keep both the
# accuracy result and the feature weights; weights are not displayed here.
wordnet_acc, wordnet_weights = p.predict_success(
    p.loader.wordnet_df_scaled,
    "WordNet",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
WordNet,Adventure_Stories,0.72
WordNet,Fiction,0.71
WordNet,Historical_Fiction,0.62
WordNet,Love_Stories,0.75
WordNet,Mystery,0.71
WordNet,Poetry,0.8
WordNet,Science_Fiction,0.59
WordNet,Short_Stories,0.62
WordNet,Average,0.69


### LIWC

In [25]:
# Run success prediction on the scaled LIWC table and keep both the
# accuracy result and the feature weights; weights are not displayed here.
liwc_acc, liwc_weights = p.predict_success(
    p.loader.liwc_df_scaled,
    "LIWC",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
LIWC,Adventure_Stories,0.66
LIWC,Fiction,0.65
LIWC,Historical_Fiction,0.52
LIWC,Love_Stories,0.46
LIWC,Mystery,0.71
LIWC,Poetry,0.6
LIWC,Science_Fiction,0.52
LIWC,Short_Stories,0.63
LIWC,Average,0.59375


### NRC Sentiment Emotion Lexicons

In [26]:
# Run success prediction on the scaled NRC table and keep both the
# accuracy result and the feature weights; weights are not displayed here.
nrc_acc, nrc_weights = p.predict_success(
    p.loader.nrc_df_scaled,
    "NRC Sentiment",
    ratio=0.2,
    add_to_acc=no_reduc_accs,
    disp_weights=False,
)

HBox(children=(FloatProgress(value=0.0, max=40.0), HTML(value='')))




Model Name,Genre,Accuracy
NRC Sentiment,Adventure_Stories,0.65
NRC Sentiment,Fiction,0.66
NRC Sentiment,Historical_Fiction,0.6
NRC Sentiment,Love_Stories,0.59
NRC Sentiment,Mystery,0.71
NRC Sentiment,Poetry,0.63
NRC Sentiment,Science_Fiction,0.55
NRC Sentiment,Short_Stories,0.57
NRC Sentiment,Average,0.62
