In [1]:
import os
import sys
import time
import numpy as np
import matplotlib.pyplot as plt
# Make the sibling `fusion` directory importable so the project-local imports
# that follow in this cell can be resolved. The path is relative to the
# kernel's working directory, so the notebook has to be launched from its own
# folder for this to point at the right place.
module_path = os.path.abspath('../../fusion')
# Guard the append: re-running this cell must not stack duplicate entries
# onto sys.path.
if module_path not in sys.path:
    sys.path.append(module_path)

from preprocessing_datasets.preprocessing_utilities import ValueUtils
from preprocessing_datasets import load_dataset
from embedding_algorithms import sentence_embedding, set_embedding_model
from dimensionality_reduction_algorithms import dimension_reduction_algorithms
from cluster_algorithms import cluster_algorithm

from helper import load_by_index, get_author_candidates, getFinalAuthors, launchWithoutReductionFusion
from plot_tools import plotChart, plotCluster

In [2]:
# Single configuration mapping handed to load_dataset, set_embedding_model and
# launchWithoutReductionFusion in the cells below.
key_values = dict(
    # Encoder options; the recorded output of set_embedding_model echoes
    # model_version, rnn_dim, model_type and char_level.
    model_type='bilstm',
    char_level=False,
    model_version=2,
    rnn_dim=1024,
    verbose=1,
    # Embedding step options (echoed per ISBN in the fusion output).
    attributes_list=['author'],
    embedding_type='inferSent',
    # Dataset selector (echoed by load_dataset as "dataset: clean_book").
    dataset='clean_book',
    # Blocking / clustering options (echoed per ISBN in the fusion output).
    cluster_method='hierarchy',
    num_clusters_rate=0.1,
    # NOTE(review): the 'thresold' spelling is the key exactly as written;
    # presumably the helpers look it up under this name -- confirm before
    # renaming it.
    block_length_thresold=0.2,
    # NOTE(review): semantics of acceptance_diff are not visible here.
    acceptance_diff=2,
)

In [3]:
# Load the dataset selected by key_values (the recorded run reports
# "dataset: clean_book"). The call yields four values, unpacked here; the
# last three are passed on to launchWithoutReductionFusion further down.
# NOTE(review): presumably records grouped per ISBN, the ISBN list and the
# ground-truth authors -- confirm against preprocessing_datasets.
dataset_name, table_group_by_isbn, isbn_list, true_authors = load_dataset(key_values)

dataset: clean_book
Loading time is: 3.329498052597046


In [4]:
# Initialise the embedding model from key_values. In the recorded run this
# cell reported a vocabulary of 2196017 entries and a setup time of roughly
# 237 seconds, so it is the slow step of the notebook.
# NOTE(review): the return value is discarded; presumably the model is kept
# as state inside embedding_algorithms -- confirm.
set_embedding_model(key_values)

Vocab size : 2196017
model_version: 2
rnn_dim: 1024
model_type: bilstm
char_level: False
Setup time is: 237.48902702331543


In [5]:
# Run the fusion pipeline over every loaded ISBN and report the wall-clock
# duration of the whole call.
start_time = time.time()
finalAuthors, trueAuthors = launchWithoutReductionFusion(
    table_group_by_isbn,
    isbn_list,
    true_authors,
    key_values,
)
total_time = time.time() - start_time
print("Total time is: {0}".format(total_time))

ISBN: 0007197160
true author: Marren Peter
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 1.1552519798278809
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.25911974906921387
Discarted candidate: [{'conservation officer': 2, 'former scientist': 2}, {'marren naturalist peter': 2}]
Possible candidate: [{'marren peter': 19}]
lengthNecessary: 5.0
[{'marren peter': 19}]
['marren peter'] VS true_author: ['marren peter']
ISBN: 0029011086
true author: Averill James R.,Nunley Elma P.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09791183471679688
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0023818016052246094
Discarted candidate: [{'elma nunley p': 4}, {'averill': 1, 'james r': 1}]
Possible candidate: [{'averill james r': 21}]
lengthNecessary: 5.4
[{'averill james r': 21}]
['averill james r'] 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08865213394165039
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001789093017578125
Discarted candidate: []
Possible candidate: [{'charles e osgood': 5, 'miron': 1, 'miron murray s': 4}, {'author': 2, 'h may william': 5}]
lengthNecessary: 3.4000000000000004
[{'charles e osgood': 5, 'miron': 1, 'miron murray s': 4}, {'author': 2, 'h may william': 5}]
['charles e osgood', 'miron murray s', 'author', 'h may william'] VS true_author: ['charles e osgood', 'h may william', 'miron murray s']
ISBN: 0262680718
true author: Rosenbloom Paul S.,Laird John E.,Newell Allen
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04846811294555664
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009949207305908203
Discarted candidate: []
Possible candidate: [{'alle

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05223393440246582
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0016481876373291016
Discarted candidate: [{'maurice thompson': 1}]
Possible candidate: [{'moritz thomsen': 16}]
lengthNecessary: 3.4000000000000004
[{'moritz thomsen': 16}]
['moritz thomsen'] VS true_author: ['moritz thomsen']
ISBN: 0439436559
true author: Nix Garth
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08256673812866211
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.0042269229888916016
Discarted candidate: [{'garth nix': 2}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}]
Possible candidate: [{'garth nix': 45}]
lengthNecessary: 10.200000000000001
[{'garth nix': 45}]
['garth nix'] VS true_author: ['garth nix']
ISBN: 0439670195
true author: Ker

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20477700233459473
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.012493133544921875
Discarted candidate: [{'donald katz': 18}, {'adult viking': 1}, {'adult viking': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}]
Possible candidate: [{'donald katz r': 76}]
lengthNecessary: 20.400000000000002
[{'donald katz r': 76}]
['donald katz r'] VS true_author: ['donald katz r']
ISBN: 0671640984
true author: Turnbull Colin M.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10827898979187012
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005129814147949219
Discarted candidate: [{'colin turnbull': 7}, {'turnbull': 2}, {'colin m turnbull': 1}, {'colin m turnbull': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0762178897857666
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002029895782470703
Discarted candidate: [{'beattie william': 5}, {'beatty dr william': 1}, {'beattie w': 1}]
Possible candidate: [{'a m ross': 1, 'alexander m ross': 22, 'alexander ross': 1}]
lengthNecessary: 6.2
[{'a m ross': 1, 'alexander m ross': 22, 'alexander ross': 1}]
['alexander m ross'] VS true_author: ['alexander m ross']
ISBN: 0802115462
true author: Weddle David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.058576107025146484
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0018248558044433594
Discarted candidate: [{'american heritage': 1}]
Possible candidate: [{'david peckinpah re sam weddle': 1, 'david weddle': 16}]
lengthNecessary: 3.6
[{'david peckinpah re sam w

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.043578147888183594
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0011382102966308594
Discarted candidate: []
Possible candidate: [{'burt carl': 5, 'ny press research': 1}]
lengthNecessary: 1.2000000000000002
[{'burt carl': 5, 'ny press research': 1}]
['burt carl'] VS true_author: ['burt carl']
ISBN: 186152207X
true author: Pass Christopher,Lowes Bryan,Robinson Andrew
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07018494606018066
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0019102096557617188
Discarted candidate: []
Possible candidate: [{'c l pass': 6, 'chris pass': 2, 'christopher pass': 1, 'pass': 5}, {'bryan lowes': 4, 'bryan lowes pass': 1, 'byran lowes': 3}, {'andrew robinson': 6, 'christopher': 1}]
lengthNecessary: 5.80000000000

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06488537788391113
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0016367435455322266
Discarted candidate: [{'d m': 1}]
Possible candidate: [{'matthew sleeth': 14}, {'zondervan': 9}]
lengthNecessary: 4.800000000000001
[{'matthew sleeth': 14}, {'zondervan': 9}]
['matthew sleeth', 'zondervan'] VS true_author: ['matthew sleeth']
ISBN: 0080174159
true author: Braund  H. E. W.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04276108741760254
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0014050006866455078
Discarted candidate: []
Possible candidate: [{'braund e h': 1, 'braund e h w': 5, 'braund harold': 1}]
lengthNecessary: 1.4000000000000001
[{'braund e h': 1, 'braund e h w': 5, 'braund harold': 1}]
['braund e h w'] VS true_author: ['braund e h

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10740995407104492
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.004541873931884766
Discarted candidate: [{'hudson r': 1}]
Possible candidate: [{'hudson rock': 14}, {'davidson sara': 14}]
lengthNecessary: 5.800000000000001
[{'hudson rock': 14}, {'davidson sara': 14}]
['hudson rock', 'davidson sara'] VS true_author: ['hudson rock', 'davidson sara']
ISBN: 0300063555
true author: Barrell John
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17871499061584473
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0023679733276367188
Discarted candidate: [{'barrell john professor': 3}, {'barrell john': 2}, {'barrel john': 1}]
Possible candidate: [{'barrell john': 25}]
lengthNecessary: 6.2
[{'barrell john': 25}]
['barrell john'] VS true_author: ['barrell 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08681011199951172
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0022559165954589844
Discarted candidate: []
Possible candidate: [{'e mark mendenhall': 12}, {'g?nter k stahl': 4, 'gunter k stahl': 1, 'günter k stahl': 1, 'stahl': 3}, {'gary oddou r': 7}, {'m mendenhall': 2, 'mendenhall': 2, 'mendenhall oddou': 3}]
lengthNecessary: 7.0
[{'e mark mendenhall': 12}, {'g?nter k stahl': 4, 'gunter k stahl': 1, 'günter k stahl': 1, 'stahl': 3}, {'gary oddou r': 7}, {'m mendenhall': 2, 'mendenhall': 2, 'mendenhall oddou': 3}]
['e mark mendenhall', 'g?nter k stahl', 'stahl', 'gary oddou r', 'mendenhall', 'mendenhall oddou'] VS true_author: ['e mark mendenhall', 'gary oddou r', 'günter k stahl']
ISBN: 0446514098
true author: Gale Robert Peter,Hauser Thomas
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Emb

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08022403717041016
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.004913806915283203
Discarted candidate: [{'rich': 1}, {'deborah hawkins': 1}]
Possible candidate: [{'deutschlander ed': 18}, {'campe deutschlander ed': 1, 'campe rich': 16}]
lengthNecessary: 7.4
[{'deutschlander ed': 18}, {'campe deutschlander ed': 1, 'campe rich': 16}]
['deutschlander ed', 'campe rich'] VS true_author: ['deutschlander ed', 'campe rich']
ISBN: 0615314074
true author: Chetouane Djaffar
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.030305862426757812
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0015022754669189453
Discarted candidate: [{'inscribed': 1}, {'chetouane djaffar': 1}]
Possible candidate: [{'chetouane djaffar': 19}]
lengthNecessary: 4.2
[{'chetouan

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06746387481689453
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0016047954559326172
Discarted candidate: []
Possible candidate: [{'margaret weis': 11}, {'a valerie valusek': 1, 'etal': 1, 'hickman tracy': 6, 'jaquays paul': 1}]
lengthNecessary: 4.0
[{'margaret weis': 11}, {'a valerie valusek': 1, 'etal': 1, 'hickman tracy': 6, 'jaquays paul': 1}]
['margaret weis', 'hickman tracy'] VS true_author: ['margaret weis', 'hickman tracy']
ISBN: 0810907240
true author: Grundberg Andy
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.041938066482543945
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.001692056655883789
Discarted candidate: [{'alexey brodovitch': 2}, {'andy grundberg': 1}]
Possible candidate: [{'andy grundberg': 20}]
lengthNecessary: 4.6

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04812908172607422
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0014917850494384766
Discarted candidate: []
Possible candidate: [{'bruce koffler': 12}, {'clive dobson': 4}]
lengthNecessary: 3.2
[{'bruce koffler': 12}, {'clive dobson': 4}]
['bruce koffler', 'clive dobson'] VS true_author: ['bruce koffler']
ISBN: 0950176311
true author: Kersting A. F.,Watkin David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.03151893615722656
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0015292167663574219
Discarted candidate: []
Possible candidate: [{'a f kersting': 2, 'david watkin': 3}]
lengthNecessary: 1.0
[{'a f kersting': 2, 'david watkin': 3}]
['a f kersting', 'david watkin'] VS true_author: ['a david f kersting watkin']
ISBN: 0961515007
true aut

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06459593772888184
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0012271404266357422
Discarted candidate: []
Possible candidate: [{'a': 1, 'rod schumacher': 11}, {'donald rodney schumacher': 3}]
lengthNecessary: 3.0
[{'a': 1, 'rod schumacher': 11}, {'donald rodney schumacher': 3}]
['rod schumacher', 'donald rodney schumacher'] VS true_author: ['rod schumacher']
ISBN: 1931456372
true author: Anghie Christine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.038657188415527344
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0018711090087890625
Discarted candidate: [{'aguanno pmp': 1}]
Possible candidate: [{'anghie christine': 11, 'kevin mapm': 1}]
lengthNecessary: 2.6
[{'anghie christine': 11, 'kevin mapm': 1}]
['anghie christine'] VS true_autho

NUM_CLUSTERS 4
Blocking time is: 0.003058910369873047
Discarted candidate: [{'black clara': 1}, {'black cara': 1}, {'black cara': 1}]
Possible candidate: [{'black cara': 29}]
lengthNecessary: 6.4
[{'black cara': 29}]
['black cara'] VS true_author: ['black cara']
ISBN: 3877580505
true author: Wolff H. G.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07065606117248535
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0018219947814941406
Discarted candidate: []
Possible candidate: [{'g h wolff': 1, 'g hans wolff': 1, 'g?nter hans': 1, 'g?nter hans wolff': 3, 'gunter hans wolff': 2, 'hunde katzen wolff': 1}]
lengthNecessary: 1.8
[{'g h wolff': 1, 'g hans wolff': 1, 'g?nter hans': 1, 'g?nter hans wolff': 3, 'gunter hans wolff': 2, 'hunde katzen wolff': 1}]
['g h wolff', 'g?nter hans', 'g?nter hans wolff', 'hunde katzen wolff'] VS true_author: ['g h wolff']
ISBN: 0520212118
true author: Erring

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1328279972076416
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005006074905395508
Discarted candidate: [{'dean karlan': 1}, {'appel jacob': 1}, {'dean karlan': 1}, {'appel jacob': 1}]
Possible candidate: [{'dean karlan': 29}, {'appel jacob': 21}]
lengthNecessary: 10.8
[{'dean karlan': 29}, {'appel jacob': 21}]
['dean karlan', 'appel jacob'] VS true_author: ['dean karlan', 'appel jacob']
ISBN: 0375501037
true author: Jones Steve
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09764599800109863
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.003298044204711914
Discarted candidate: [{'j k rowling': 5}, {'jones steve': 1}, {'jones steve': 1}]
Possible candidate: [{'jones steve': 30}]
lengthNecessary: 7.4
[{'jones steve': 30}]
['jones steve'] VS

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16419291496276855
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0036160945892333984
Discarted candidate: []
Possible candidate: [{'b': 1, 'b nuland sherwin': 9}, {'nuland sherwin': 7}]
lengthNecessary: 3.4000000000000004
[{'b': 1, 'b nuland sherwin': 9}, {'nuland sherwin': 7}]
['b nuland sherwin'] VS true_author: ['b nuland sherwin']
ISBN: 0333349954
true author: Pym Barbara
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.21249985694885254
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.004172801971435547
Discarted candidate: [{'barbara hazel holt pym': 1}]
Possible candidate: [{'barbara pym': 16}, {'hilary pym': 9}, {'hazel holt': 8}]
lengthNecessary: 6.800000000000001
[{'barbara pym': 16}, {'hilary pym': 9}, {'hazel holt': 8}]
['barbara p

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1494579315185547
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.006466865539550781
Discarted candidate: [{'green jonathon': 6}, {'green jonathan': 2}, {'green jonathan': 1}, {'green jonathan': 1}, {'green jonathan': 1}, {'green jonathon': 1}, {'green jonathon': 1}]
Possible candidate: [{'green jonathon': 59}]
lengthNecessary: 14.4
[{'green jonathon': 59}]
['green jonathon'] VS true_author: ['green jonathon']
ISBN: 0295961309
true author: Fowler David C.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07881593704223633
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0018911361694335938
Discarted candidate: [{'c david fowler professor': 5}, {'fowler': 5}]
Possible candidate: [{'c david fowler': 17, 'david fowler': 2}]
lengthNecessary: 5.800000

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16508102416992188
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013216972351074219
Discarted candidate: [{"health magazine men's": 4}, {"health magazine men's of the": 2}, {'g mark': 1}, {'books health mens staff': 1}, {"health men's of": 1}, {"health men's": 1}, {"books health men's staff": 1}, {'dollemore doug': 1}]
Possible candidate: [{'dollemore doug': 44, 'dollermore doug': 1}, {'giuliucci mark': 42, 'giuliuci mark': 1}]
lengthNecessary: 20.0
[{'dollemore doug': 44, 'dollermore doug': 1}, {'giuliucci mark': 42, 'giuliuci mark': 1}]
['dollemore doug', 'giuliucci mark'] VS true_author: ['dollemore doug', 'giuliucci mark']
ISBN: 0471177881
true author: Yeager Neil,Hough Lee
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2067561149597168
cluster_method: hierarchy
num_clus

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07815885543823242
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0026640892028808594
Discarted candidate: [{'betrayal heart?s pb': 1}, {'coble colleen': 1}, {'coble colleen': 1}, {'coble colleen': 1}]
Possible candidate: [{'coble colleen': 37}]
lengthNecessary: 8.200000000000001
[{'coble colleen': 37}]
['coble colleen'] VS true_author: ['coble colleen']
ISBN: 0932750559
true author: Prechter Robert R. Jr.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06349396705627441
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0016918182373046875
Discarted candidate: []
Possible candidate: [{'jr prechter r robert': 13}, {'prechter r robert': 7, 'prechter robert': 1}, {'classics library new': 1, 'inc': 1, 'jr': 4, 'jr r': 1}]
lengthNecessary: 5.6000000

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06204509735107422
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0015230178833007812
Discarted candidate: [{'steve thomas': 4}, {'d stephen thomas': 1}]
Possible candidate: [{'d stephen thomas': 18}]
lengthNecessary: 4.6000000000000005
[{'d stephen thomas': 18}]
['d stephen thomas'] VS true_author: ['steve thomas']
ISBN: 1846250811
true author: McQuoid Stephen
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.03134632110595703
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009260177612304688
Discarted candidate: []
Possible candidate: [{'mcquoid': 1, 'mcquoid stephen': 6, 'phd': 2, 'stephen': 1}]
lengthNecessary: 2.0
[{'mcquoid': 1, 'mcquoid stephen': 6, 'phd': 2, 'stephen': 1}]
['mcquoid stephen'] VS true_author: ['mcquoid stephen']
ISBN: 0

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07210898399353027
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0026569366455078125
Discarted candidate: [{'american association diabetes': 1}, {'good phyllis': 1}, {'good phyllis': 1}]
Possible candidate: [{'good pellman phyllis': 4, 'good phyllis': 29}]
lengthNecessary: 7.2
[{'good pellman phyllis': 4, 'good phyllis': 29}]
['good phyllis'] VS true_author: ['good pellman phyllis']
ISBN: 1555426654
true author: Rothwell William J.,Kazanas H. C.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0634453296661377
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001188039779663086
Discarted candidate: []
Possible candidate: [{'j rothwell william': 9}, {'c h kazanas': 7}]
lengthNecessary: 3.2
[{'j rothwell william': 9}, {'c h kazanas': 7}]
['j roth

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0879220962524414
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.002562999725341797
Discarted candidate: []
Possible candidate: [{'amanda jessica salmonson': 14}, {'a jessica salmonson': 1, 'jessica salmonson': 5}]
lengthNecessary: 4.0
[{'amanda jessica salmonson': 14}, {'a jessica salmonson': 1, 'jessica salmonson': 5}]
['amanda jessica salmonson'] VS true_author: ['amanda jessica salmonson']
ISBN: 1579125255
true author: Hathaway Nancy
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06727886199951172
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0014960765838623047
Discarted candidate: [{'hathaway': 1}, {'hathaway nancy': 1}]
Possible candidate: [{'hathaway nancy': 22}]
lengthNecessary: 4.800000000000001
[{'hathaway nancy': 22}]
['hathawa

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10423827171325684
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0029718875885009766
Discarted candidate: [{'james mckean n': 3}, {'james mckean': 2}, {'james mckean': 1}]
Possible candidate: [{'james mckean': 28}]
lengthNecessary: 6.800000000000001
[{'james mckean': 28}]
['james mckean'] VS true_author: ['james mckean']
ISBN: 0805043683
true author: Moe Richard,Wilkie Carter
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2158348560333252
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.010936975479125977
Discarted candidate: [{'moe richard': 1}, {'carter wilkie': 1}, {'carter wilkie': 1}, {'carter wilkie': 1}, {'carter wilkie': 1}, {'carter wilkie': 1}, {'carter wilkie': 1}]
Possible candidate: [{'moe richard': 46}, {'carter wilkie': 37}]
l

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2581198215484619
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01586627960205078
Discarted candidate: [{'morrison toni': 1}, {'morrrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}, {'morrison toni': 1}]
Possible candidate: [{'morrison toni': 105}]
lengthNecessary: 22.8
[{'morrison toni': 105}]
['morrison toni'] VS true_author: ['morrison toni']
ISBN: 0306803038
true author: Cabanne Pierre
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20998382568359375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.012924909591674805
Discarted candidate: [{'jasper johns': 6}, {'duchamp marcel': 4}, {'an appreciation jasper johns': 2}, {'padgett ron': 2}, {'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08167886734008789
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0027692317962646484
Discarted candidate: [{'agatha christie': 2}, {'collectif': 1}, {'agatha christie': 1}]
Possible candidate: [{'agatha christie': 32}]
lengthNecessary: 7.2
[{'agatha christie': 32}]
['agatha christie'] VS true_author: ['agatha christie']
ISBN: 0094646805
true author: Poucher W. A.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.058547258377075195
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.002290010452270508
Discarted candidate: [{'a poucher w': 1}]
Possible candidate: [{'a poucher w': 18}, {'arthur poucher william': 5}]
lengthNecessary: 4.800000000000001
[{'a poucher w': 18}, {'arthur poucher william': 5}]
['a poucher w', 'arthur poucher william'] VS tru

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08724617958068848
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0031599998474121094
Discarted candidate: [{'grove pr': 1}, {'peter throckmotron': 1}]
Possible candidate: [{'peter throckmorton': 26}]
lengthNecessary: 5.6000000000000005
[{'peter throckmorton': 26}]
['peter throckmorton'] VS true_author: ['peter throckmorton']
ISBN: 0521433606
true author: Manly Peter L.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09411501884460449
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0017981529235839844
Discarted candidate: [{'astronomie rarit?t': 1}, {'l manly peter': 1}]
Possible candidate: [{'l manly peter': 24}]
lengthNecessary: 5.2
[{'l manly peter': 24}]
['l manly peter'] VS true_author: ['l manly peter']
ISBN: 1890771848
true author: Mad

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10877680778503418
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0031418800354003906
Discarted candidate: [{'design glaser milton the': 1}, {'a foreword george lang': 1}, {'klein matthew photographs': 1}]
Possible candidate: [{'judith olney': 36}]
lengthNecessary: 7.800000000000001
[{'judith olney': 36}]
['judith olney'] VS true_author: ['judith olney']
ISBN: 0471490768
true author: Wiseman Helen,Goldfarb Peter,Ridgway Tim,Wiseman Alan
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10280776023864746
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0031921863555908203
Discarted candidate: [{'goldfarb peter': 6, 'goldfarb peter ridgway tim': 1}, {'alan wiseman': 6}, {'ridgway tim': 6}, {'wiseman': 4}]
Possible candidate: [{'helen wiseman': 19}

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07719087600708008
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015101432800292969
Discarted candidate: []
Possible candidate: [{'cma': 1, 'cpa': 1, 'cpa davidson sidney': 1, 'davidson in-chief sidney': 1, 'davidson sidney': 6}, {'l roman weil': 6, 'roman weil': 2}]
lengthNecessary: 3.6
[{'cma': 1, 'cpa': 1, 'cpa davidson sidney': 1, 'davidson in-chief sidney': 1, 'davidson sidney': 6}, {'l roman weil': 6, 'roman weil': 2}]
['davidson sidney', 'l roman weil'] VS true_author: ['l roman weil', 'davidson sidney']
ISBN: 0785288104
true author: Jones Laurie Beth
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06733369827270508
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.002020120620727539
Discarted candidate: [{'jones': 1}, {'jones laurie':

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05341005325317383
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0031239986419677734
Discarted candidate: [{'alan titchmarsh': 1}, {'alan titchmarsh': 1}, {'alan titchmarsh': 1}, {'alan titchmarsh': 1}]
Possible candidate: [{'alan titchmarsh': 38, 'alan titichmarsh': 2}]
lengthNecessary: 8.8
[{'alan titchmarsh': 38, 'alan titichmarsh': 2}]
['alan titchmarsh'] VS true_author: ['alan titchmarsh']
ISBN: 0899061710
true author: Goldberg Chaim Binyamin
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.061586856842041016
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0011248588562011719
Discarted candidate: []
Possible candidate: [{'?ayim b ben binyamin goldberg p': 1, 'binyamin chaim goldberg': 3, 'fox-ashrei shlomo': 2, 'meir zlotowitz': 3}, {'go

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07007837295532227
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.003545999526977539
Discarted candidate: [{'k nair': 1}, {'keshavan nair': 1}, {'keshavan nair': 1}, {'keshavan nair': 1}]
Possible candidate: [{'keshavan nair': 44, 'nair': 1}]
lengthNecessary: 9.8
[{'keshavan nair': 44, 'nair': 1}]
['keshavan nair'] VS true_author: ['keshavan nair']
ISBN: 0415422051
true author: Emmerson Richard K.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10382270812988281
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0033540725708007812
Discarted candidate: [{'clayton-emmerson sandra': 4}, {'clayton-emmerson sandra': 2}, {'clayton-emmerson eds sandra': 1}, {'emmerson k richard': 1}]
Possible candidate: [{'emmerson k richard': 39}]
lengthNecessary: 9.

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07187294960021973
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.003612041473388672
Discarted candidate: [{'iii kiechel walter': 7}, {'kiechel w': 4}, {'kiechel w': 1}, {'kiechel walter': 1}]
Possible candidate: [{'kiechel walter': 29, 'walter': 1}]
lengthNecessary: 8.6
[{'kiechel walter': 29, 'walter': 1}]
['kiechel walter'] VS true_author: ['iii kiechel walter']
ISBN: 0733306195
true author: Dickson Wright Clarissa,Paterson Jennifer
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06725811958312988
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001589059829711914
Discarted candidate: [{'clarissa dickson wright': 3}]
Possible candidate: [{'clarissa dickson-wright': 3, 'dickson-wright': 2, 'dickson-wright paterson': 5, 'jennifer paterson': 3

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04700016975402832
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015099048614501953
Discarted candidate: [{'h?l?ne hanff': 1}]
Possible candidate: [{'hanff helene': 17}]
lengthNecessary: 3.6
[{'hanff helene': 17}]
['hanff helene'] VS true_author: ['hanff helene']
ISBN: 014006060X
true author: Mortimer John
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04000401496887207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009458065032958984
Discarted candidate: []
Possible candidate: [{'clifford john mortimer': 1, 'john mortimer': 2}]
lengthNecessary: 0.6000000000000001
[{'clifford john mortimer': 1, 'john mortimer': 2}]
['clifford john mortimer', 'john mortimer'] VS true_author: ['john mortimer']
ISBN: 0262122995
true author: Lyson Thomas A.,

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08495283126831055
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0026590824127197266
Discarted candidate: [{'carlson melody': 1}, {'a carlson melody': 1}]
Possible candidate: [{'a carlson melody': 26}, {'carlson melody': 9}]
lengthNecessary: 7.4
[{'a carlson melody': 26}, {'carlson melody': 9}]
['a carlson melody'] VS true_author: ['carlson melody']
ISBN: 0297646281
true author: Nuland Sherwin B.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05945706367492676
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0011789798736572266
Discarted candidate: [{'da leonardo vinci': 1}]
Possible candidate: [{'b nuland sherwin': 8, 'nuland sherwin': 5}]
lengthNecessary: 2.8000000000000003
[{'b nuland sherwin': 8, 'nuland sherwin': 5}]
['b nuland sherwin'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3179152011871338
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013994216918945312
Discarted candidate: [{'cuddihy jane mary': 1, 'mary p': 1}, {'cuddihy john murray': 1, 'f john murray': 1}, {'clendenin j ryan': 1, 'j lannan patrick': 1}, {'fr regis ryan': 1}, {'alison murray': 1}, {'charlotte harrris mcdonald': 1}, {'design dunbar patricia': 1}, {'donald marshall w': 1}, {'cuddihy de harriet haven': 1}]
Possible candidate: [{'birmingham stephen': 86}]
lengthNecessary: 19.6
[{'birmingham stephen': 86}]
['birmingham stephen'] VS true_author: ['birmingham stephen']
ISBN: 0060112980
true author: Ford Betty
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.46541500091552734
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02936697006225586
Disca

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.37836503982543945
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.009633779525756836
Discarted candidate: [{'bienvenu marcelle': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}]
Possible candidate: [{'emeril lagasse': 73}]
lengthNecessary: 16.0
[{'emeril lagasse': 73}]
['emeril lagasse'] VS true_author: ['emeril lagasse']
ISBN: 006018650X
true author: Taylor Bradford Barbara
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3575630187988281
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01780414581298828
Discarted candidate: [{'barbara bradford taylor': 2}, {'barbera bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1},

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1867227554321289
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.006478071212768555
Discarted candidate: [{'e feist raymond': 2}, {'e feist raymong': 1}, {'e feist raymond': 1}, {'e feist raymond': 1}, {'e feist raymond': 1}, {'e feist raymond': 1}]
Possible candidate: [{'e feist raymond': 60}]
lengthNecessary: 13.4
[{'e feist raymond': 60}]
['e feist raymond'] VS true_author: ['e feist raymond']
ISBN: 0060827130
true author: Baigent Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18007397651672363
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.018429040908813477
Discarted candidate: [{'leigh richard': 2}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigen

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.37802696228027344
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01898789405822754
Discarted candidate: [{'baynes pauline': 3}, {'baynes c lewis pauline s': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}, {'baynes pauline': 1}]
Possible candidate: [{'c lewis s': 96}]
lengthNecessary: 21.400000000000002
[{'c lewis s': 96}]
['c lewis s'] VS true_author: ['c lewis s']
ISBN: 0140004211
true author: Graves Robert
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19820189476013184
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.007302999496459961
Discarted candidate: [{'graves robert': 2}, {'graver robert': 1}, {'graves robert': 1}, {'graves robert': 1}, {

Blocking time is: 0.011430978775024414
Discarted candidate: [{'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'m pollen': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}]
Possible candidate: [{'michael pollan': 85}]
lengthNecessary: 18.8
[{'michael pollan': 85}]
['michael pollan'] VS true_author: ['michael pollan']
ISBN: 0151001006
true author: Guterson David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.34870457649230957
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0745091438293457
Discarted candidate: [{'studios': 1}, {'david guterson pictures universal': 1}, {'jr': 1}, {'f guste roy': 1}, {'david guterson': 1}, {'d guterson': 1}, {'d guterson': 1}, {'david guterson': 1}, {'david guterson': 1}]
Possible candidate: [{'david guterson': 241}]
lengthNecessary: 50.0
[{'david guterson': 241}]
['d

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3520641326904297
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.027215957641601562
Discarted candidate: [{'venturi': 3}, {'br denise scott': 1}, {'venturi': 1}, {'venturi': 1}, {'brown izenourdenise robert scott venturisteven': 1}, {'venturi': 1}, {'robert venturi': 1}]
Possible candidate: [{'izenour robert venturi': 3, 'robert venturi': 55}, {'azenour steven': 1, 'izenour steven': 41}, {'brown denise scott': 39}]
lengthNecessary: 29.6
[{'izenour robert venturi': 3, 'robert venturi': 55}, {'azenour steven': 1, 'izenour steven': 41}, {'brown denise scott': 39}]
['robert venturi', 'izenour steven', 'brown denise scott'] VS true_author: ['robert venturi', 'brown denise scott', 'izenour steven']
ISBN: 0300044402
true author: Saggs W. F. H.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding tim

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.34174084663391113
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.04759407043457031
Discarted candidate: [{'meyer stephanie': 6}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}]
Possible candidate: [{'meyer stephenie': 190}]
lengthNecessary: 40.800000000000004
[{'meyer stephenie': 190}]
['meyer stephenie'] VS true_author: ['meyer stephenie']
ISBN: 0316109304
true author: Bronowski J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12566184997558594
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015898704528808594
Discarted candidate: [{'bronowski j': 1}, {'bronowski jacob': 1}, {'bronowski j': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3286769390106201
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02613091468811035
Discarted candidate: [{'jacket keith parkinson': 1}, {'art': 1}, {'feinman jeffrey': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}]
Possible candidate: [{'brooks terry': 107}]
lengthNecessary: 23.200000000000003
[{'brooks terry': 107}]
['brooks terry'] VS true_author: ['brooks terry']
ISBN: 0345371984
true author: Adams Douglas,Carwardine Mark
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.27324914932250977
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.021151065826416016
Discarted candidate: [{'adams': 5}, {'carwardine mark': 2}, {'carwardine mark': 1}, {'carwardine mark': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23523807525634766
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.016150951385498047
Discarted candidate: [{'b greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}]
Possible candidate: [{'brian greene': 83}]
lengthNecessary: 18.400000000000002
[{'brian greene': 83}]
['brian greene'] VS true_author: ['brian greene']
ISBN: 0375414967
true author: Russo Richard
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1992037296295166
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015089035034179688
Discarted candidate: [{'richard russo': 2}, {'r russo': 1}, {'richard russo': 1}, {'richard russo': 1}, {'richard russo': 1}, {'ri

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2224888801574707
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02409219741821289
Discarted candidate: [{'marian schwartz': 12}, {'edward radzinsky': 2}, {'clifford dowdey': 2}, {'edvard radzinsky': 2}, {'marian schwartz transl': 1}, {'photos': 1}, {'edvard marian radzinsky schwartz': 1}, {'edvard radzinsky w': 1}, {'marian schwartz trans': 1}]
Possible candidate: [{'edvard radzinskii': 4, 'edvard radzinsky': 103}]
lengthNecessary: 26.0
[{'edvard radzinskii': 4, 'edvard radzinsky': 103}]
['edvard radzinsky'] VS true_author: ['edvard radzinsky']
ISBN: 0385425473
true author: Chang Jung
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23803305625915527
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013000249862670898
Discarted candidate: [{'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24352192878723145
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0256040096282959
Discarted candidate: [{'a rice': 6}, {'anne rice': 2}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}]
Possible candidate: [{'anne rice': 123}]
lengthNecessary: 27.6
[{'anne rice': 123}]
['anne rice'] VS true_author: ['anne rice']
ISBN: 0394502787
true author: Pagels Elaine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12839603424072266
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008625984191894531
Discarted candidate: [{'elaine h pagels': 9}, {'elaine pagels': 4}, {'elaine pagels': 3}, {'elaine h pagels': 2}, {'elaine pagels': 1}, {'elaine pagels': 1}, {'elaine pagels': 1}]
Po

Blocking time is: 0.24939608573913574
Discarted candidate: [{'rosalynn': 53}, {'cartere jimmy': 2, 'jimmy': 15}, {'crater jimmy': 2}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn y': 1}]
Possible candidate: [{'carter jimmy': 228}, {'*signed carter rosalynn': 2, 'carter rosalynn': 162}]
lengthNecessary: 93.80000000000001
[{'carter jimmy': 228}, {'*signed carter rosalynn': 2, 'carter rosalynn': 162}]
['carter jimmy', 'carter rosalynn'] VS true_author: ['carter jimmy', 'carter rosalynn']
ISBN: 0394561236
true author: Gore Vidal
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2241051197052002
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.022170066833496094
Discarted candidate: [{'box edgar': 2}, {'gore vidal': 1}, {'box edgar': 1}, {'box edgar': 1}, {'box edgar': 1}, {'box edgar': 1}, {'j robert stanton': 1}, {'box edgar': 1}, {'eric lustbader van': 1}]
P

[{'clifton fadiman': 54}]
['clifton fadiman'] VS true_author: ['clifton fadiman']
ISBN: 0395486025
true author: Least Heat-Moon William
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5600259304046631
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.10028791427612305
Discarted candidate: [{'heat moon': 29}, {'heat l moon william': 2, 'heat least moon william': 9}, {'heat-moon least': 5}, {'heat-moon': 4}, {'white': 3}, {'black photographs': 3}, {'e i trogdon william': 2}, {'hank stuever': 2}, {'heat-moon least wm': 1}]
Possible candidate: [{'heat-moon least william': 211, 'least william': 29}]
lengthNecessary: 60.0
[{'heat-moon least william': 211, 'least william': 29}]
['heat-moon least william'] VS true_author: ['heat-moon least william']
ISBN: 0395488842
true author: Harrison Jim
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.22634029388427734
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.011304140090942383
Discarted candidate: [{'carol colman': 19}, {'gary heaven': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'carol colman': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'gary heavin': 1}]
Possible candidate: [{'gary heavin': 70}]
lengthNecessary: 19.400000000000002
[{'gary heavin': 70}]
['gary heavin'] VS true_author: ['gary heavin', 'carol colman']
ISBN: 0399157824
true author: Cussler Clive,Brown Graham
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2631690502166748
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.021939992904663086
Discarted candidate: [{'brown graham': 4}, {'clive cussler': 2}, {'brown graham': 1}, {'adventure austin ku

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3486959934234619
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.032109737396240234
Discarted candidate: [{'collectif': 2}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}]
Possible candidate: [{'briggs patricia': 156}]
lengthNecessary: 33.2
[{'briggs patricia': 156}]
['briggs patricia'] VS true_author: ['briggs patricia']
ISBN: 0446387878
true author: Dorris Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1660289764404297
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014390945434570312
Discarted candidate: [{'dorris michael': 2}, {'dorris morris': 1}, {'dorris michael': 1}, {'dorris michae

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2613959312438965
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.010837078094482422
Discarted candidate: [{'hawking stephen': 7}, {'krauss lawrence': 3}, {'foreword hawking stephen': 2}, {'krauss': 1}, {'albee edward': 1}, {'krauss lawrence m w': 1}, {'m': 1}, {'foreword': 1}]
Possible candidate: [{'krauss lawrence m': 72}]
lengthNecessary: 17.8
[{'krauss lawrence m': 72}]
['krauss lawrence m'] VS true_author: ['krauss lawrence m']
ISBN: 051511779X
true author: Roberts Nora
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18505382537841797
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013020992279052734
Discarted candidate: [{'noraauthor roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.4898672103881836
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.07112812995910645
Discarted candidate: [{'a iacocca lee': 29}, {'a et iacocca lee novak william': 2}, {'iacocca lee w': 2}, {'novak wm': 2}, {'iacocca l': 1}, {'iacocca l': 1}, {'iacocca lee': 1}, {'iacocca lee': 1}]
Possible candidate: [{'iacocca lee': 153}, {'novak william': 60}]
lengthNecessary: 50.400000000000006
[{'iacocca lee': 153}, {'novak william': 60}]
['iacocca lee', 'novak william'] VS true_author: ['iacocca lee']
ISBN: 0553051253
true author: Benford Gregory,Brin David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19764280319213867
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01940321922302246
Discarted candidate: [{'ad benford brin david gregory': 1}, {'brin

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.257692813873291
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.022578954696655273
Discarted candidate: [{'fulrimari jeffrey': 2, 'fulvimari jeffrey': 10}, {'fulrimari jeffrey madonna': 4, 'fulvimari jeffrey madonna': 1, 'louise madonna': 1}, {'ciccone madonna': 1, 'madonna ritchie': 3}, {'blue': 1, 'fulvimari': 1, 'hand signed': 1}, {'blue in ink madonna written': 1, 'color delightful fulvimari in jeffrey whimsically': 1}, {'designed dj masuda toshiya': 1}, {'rock singer the': 1}, {'endpapers guaranteed pink': 1}, {'her is married name': 1}]
Possible candidate: [{'by madonna': 1, 'fulvimari madonna': 1, 'madona': 1, 'madonna': 95}]
lengthNecessary: 25.8
[{'by madonna': 1, 'fulvimari madonna': 1, 'madona': 1, 'madonna': 95}]
['madonna'] VS true_author: ['madonna']
ISBN: 0670063568
true author: Keillor Garrison
embedding_type: inferSent
att

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1621870994567871
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009161949157714844
Discarted candidate: [{'boyle coraghessan t': 2}, {'coraghessan': 1}, {'c': 1}, {'boyle c t': 1}, {'boyd malcolm': 1}, {'boyle c t': 1}, {'boyle c t': 1}]
Possible candidate: [{'boyle c t': 62}, {'boyle coraghessan t': 18, 'boyle t': 1}]
lengthNecessary: 17.8
[{'boyle c t': 62}, {'boyle coraghessan t': 18, 'boyle t': 1}]
['boyle c t', 'boyle coraghessan t'] VS true_author: ['boyle c t']
ISBN: 0670891916
true author: Bradford Sarah
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1421527862548828
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009515047073364258
Discarted candidate: [{'bradford sarah': 2}, {'kennedy': 1}, {'jacqueline onassis': 1}, {'bradford sa

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3958897590637207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.056054115295410156
Discarted candidate: [{'collier': 2}, {'horowitz peter': 1}, {'collier horo': 1}, {'peter': 1}, {'h perkin': 1}, {'collier peter': 1}, {'collier peter': 1}, {'horowitz': 1}]
Possible candidate: [{'collier peter': 110}, {'david horowitz': 101}]
lengthNecessary: 44.0
[{'collier peter': 110}, {'david horowitz': 101}]
['collier peter', 'david horowitz'] VS true_author: ['collier peter', 'david horowitz']
ISBN: 0671622617
true author: Prager Dennis,Telushkin Joseph
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1773090362548828
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.018591880798339844
Discarted candidate: [{'joseph telushkin': 2}, {'joseph rabbi telushk

Blocking time is: 0.019473791122436523
Discarted candidate: [{'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}]
Possible candidate: [{'chang jung': 65}, {'halliday jon': 56}]
lengthNecessary: 25.8
[{'chang jung': 65}, {'halliday jon': 56}]
['chang jung', 'halliday jon'] VS true_author: ['chang jung', 'halliday jon']
ISBN: 0679425411
true author: Shaara Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11337900161743164
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.006421089172363281
Discarted candidate: [{'michael shaara': 4}, {'michael shaara': 1}, {'bob loomis': 1}, {'shaara': 1}, {'shaara': 1}, {'michael shaara': 1}, {'michael shaara': 1}]
Possible candidate: [{'michael shaara': 61}]
lengthNecessary: 14.200000000000001
[{'michael shaara': 61}]
['michael shaara'] VS true

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18686485290527344
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.007080078125
Discarted candidate: [{'conway jill': 1, 'conway jill k': 1, 'conway jill kathryn': 1, 'conway jill kerr': 2}, {'jill ker': 1, 'ker': 1}, {'american autobiographies herself of vol women': 1}, {'conway': 1}, {'cecilia gaposchkin payne': 1}, {'anna howard shaw': 1}, {'anon': 1}]
Possible candidate: [{'conway jill ker': 60}]
lengthNecessary: 14.4
[{'conway jill ker': 60}]
['conway jill ker'] VS true_author: ['conway jill ker']
ISBN: 0679762906
true author: Negroponte Nicholas
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20912408828735352
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017268896102905273
Discarted candidate: [{'books house random vintage': 6}, {'as

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5142788887023926
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.06037282943725586
Discarted candidate: [{'bush k mildred': 8}, {'drew lisa': 6}, {'bush kerr mildred': 4}, {'as barbar bush dictated millie to': 2, 'as barbara bush dictated millie to': 2}, {'as barbara bush dedicated to': 2}, {'as barbara bush dictated to': 2}, {'millie': 2}, {'barbara bush millie': 2}]
Possible candidate: [{'barbara bush': 132}, {'bush millie': 65}]
lengthNecessary: 45.400000000000006
[{'barbara bush': 132}, {'bush millie': 65}]
['barbara bush', 'bush millie'] VS true_author: ['barbara bush']
ISBN: 0688075916
true author: Smith Jeff
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12999510765075684
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.00648498535156

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1284949779510498
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008354663848876953
Discarted candidate: [{'gregory philippa': 2}, {'gregory': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}]
Possible candidate: [{'gregory philippa': 67}]
lengthNecessary: 15.0
[{'gregory philippa': 67}]
['gregory philippa'] VS true_author: ['gregory philippa']
ISBN: 0743249925
true author: Dunning John
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23673605918884277
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02188420295715332
Discarted candidate: [{'dunning john': 6}, {'dunning h john': 2}, {'dunning john': 1}, {'dunning john s': 1}, {'dunning john': 1}, {'dunning john': 1}

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23345518112182617
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.013375997543334961
Discarted candidate: [{'macomber': 8}, {'macomber': 2}, {'debbie macomber': 1}, {'macomber': 1}, {'macomber': 1}, {'macomber': 1}, {'macomber': 1}]
Possible candidate: [{'debbie macomber': 64}]
lengthNecessary: 15.8
[{'debbie macomber': 64}]
['debbie macomber'] VS true_author: ['debbie macomber']
ISBN: 0785211578
true author: Anderson Ken
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3780789375305176
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015998125076293945
Discarted candidate: [{'hayes john': 11}, {'anderson ken': 1}, {'anderson ken': 1}, {'anderson ken': 1}, {'anderson ken': 1}, {'anderson ken': 1}, {'anderson ken': 1}, {'anderson ken': 1}, {'an

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17277908325195312
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015378952026367188
Discarted candidate: [{'carter jimmy': 2}, {'*author carter jimmy signed': 1}, {'carter j': 1}, {'carter jimmy': 1}, {'carter jimmy': 1}, {'carter jimmy': 1}, {'carter jimmy': 1}, {'carter jimmy': 1}, {'carter jimmy': 1}]
Possible candidate: [{'carter jimmy': 104}]
lengthNecessary: 22.8
[{'carter jimmy': 104}]
['carter jimmy'] VS true_author: ['carter jimmy']
ISBN: 0824602560
true author: Kolatch J. Alfred
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13875198364257812
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009541988372802734
Discarted candidate: [{'alred j kolatch': 1}, {'kolatch': 1}, {'alfred kolatch': 1}, {'rabbi': 1}, {'alfred j kolatch': 1},

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20855498313903809
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017323017120361328
Discarted candidate: [{'get shorty': 1}, {'ellmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}, {'elmore leonard': 1}]
Possible candidate: [{'elmore leonard': 112}]
lengthNecessary: 24.200000000000003
[{'elmore leonard': 112}]
['elmore leonard'] VS true_author: ['elmore leonard']
ISBN: 0877958416
true author: Leonard Elmore
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.21038007736206055
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01906108856201172
Discarted candidate: [{'art cover': 1}, {'kathawala': 1}, {'elmore leanard': 1}, {'elmore leonard': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.14838767051696777
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.010753870010375977
Discarted candidate: [{'albom': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}, {'albom mitch': 1}]
Possible candidate: [{'albom mitch': 84}]
lengthNecessary: 18.6
[{'albom mitch': 84}]
['albom mitch'] VS true_author: ['albom mitch']
ISBN: 1401323588
true author: Colfer Eoin
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16513323783874512
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011178970336914062
Discarted candidate: [{'colfer eoin': 2}, {'colfer eoin': 1}, {'adams douglas': 1}, {'colfer eoin': 1}, {'colfer eoin': 1}, {'colfer eoin': 1}, {'colfer eoin': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17694377899169922
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.0058307647705078125
Discarted candidate: [{'c fiorina': 1}, {'carly fiorina': 1}, {'carly fiorina': 1}, {'carly fiorina': 1}, {'carly fiorina': 1}, {'carly fiorina': 1}]
Possible candidate: [{'carly fiorina': 58}]
lengthNecessary: 12.8
[{'carly fiorina': 58}]
['carly fiorina'] VS true_author: ['carly fiorina']
ISBN: 1594201455
true author: Pollan Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23650193214416504
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011717081069946289
Discarted candidate: [{'pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}, {'michael pollan': 1}

In [6]:
from evaluation import *

# Old cases

In [13]:
# Score finalAuthors against trueAuthors (both returned by launchWithoutReductionFusion earlier in this notebook).
# Per the recorded output, the call prints precision, recall and f1Score and returns them as a 3-tuple,
# which the notebook echoes because the call is the cell's last expression.
# NOTE(review): getEvaluation presumably comes from the `from evaluation import *` star-import; the meaning
# of the third argument (1) is not visible here — confirm against evaluation.getEvaluation.
# NOTE(review): this cell's execution count (13) is out of sequence, and identical calls in this notebook
# show different scores, so the stored output is from a different run/state — re-run top to bottom before citing it.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.8682295877122069
recall is 0.9597855227882037
f1Score is 0.9117147707979626


(0.8682295877122069, 0.9597855227882037, 0.9117147707979626)

In [8]:
# Same evaluation call as the other scoring cells: compares finalAuthors with trueAuthors and, per the
# recorded output, prints precision / recall / f1Score and returns them as a tuple.
# NOTE(review): the third argument (1) is undocumented in this notebook — confirm its meaning in the evaluation module.
# NOTE(review): execution count 8 follows a cell numbered 13, so this stored output was produced in a
# different order than the cells appear; treat the numbers as a historical snapshot until re-run.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.9014567266495287
recall is 0.9401251117068812
f1Score is 0.9203849518810149


(0.9014567266495287, 0.9401251117068812, 0.9203849518810149)

# With multiple wins and similar ones removed

In [7]:
# Score finalAuthors against trueAuthors; per the recorded output this run prints the TP / FP / FN counts
# followed by precision, recall and f1Score, and returns the three scores as a tuple.
# NOTE(review): the TP/FP/FN line is absent from the other recorded getEvaluation outputs in this notebook,
# so getEvaluation itself presumably changed between those runs — verify before comparing the scores.
# NOTE(review): the meaning of the third argument (1) is not shown in this notebook — confirm in the evaluation module.
getEvaluation(finalAuthors, trueAuthors, 1)

TP: 1058, FP: 230, FN: 61
precision is 0.8214285714285714
recall is 0.9454870420017873
f1Score is 0.8791026173660157


(0.8214285714285714, 0.9454870420017873, 0.8791026173660157)