In [1]:
import os
import sys
import time
import numpy as np
import matplotlib.pyplot as plt
# Make the project's `fusion` directory importable so the project-local
# imports below resolve. The path is relative to the current working
# directory, so the notebook has to be run from its own folder.
module_path = os.path.abspath(os.path.join('..', '..', 'fusion'))
# Guard the append so re-running this cell does not pile up duplicate
# entries in sys.path.
if module_path not in sys.path:
    sys.path.append(module_path)

from preprocessing_datasets.preprocessing_utilities import ValueUtils
from preprocessing_datasets import load_dataset
from embedding_algorithms import sentence_embedding, set_embedding_model
from dimensionality_reduction_algorithms import dimension_reduction_algorithms
from cluster_algorithms import cluster_algorithm

from helper import load_by_index, get_author_candidates, getFinalAuthors, launchWithoutReductionFusion
from plot_tools import plotChart, plotCluster

In [2]:
# Single configuration object handed to load_dataset, set_embedding_model and
# launchWithoutReductionFusion. Key names are looked up by project code, so
# they are kept exactly as spelled (including 'block_length_thresold').
key_values = dict(
    # Embedding model settings (echoed back by set_embedding_model).
    model_type='bilstm',
    char_level=False,
    model_version=2,
    rnn_dim=1024,
    verbose=1,
    # What gets embedded and with which encoder.
    attributes_list=['author'],
    embedding_type='inferSent',
    # Input data.
    dataset='clean_book',
    # Blocking / clustering stage.
    cluster_method='hierarchy',
    # NOTE(review): appears to scale the cluster count with the number of
    # records per ISBN -- confirm in the project code.
    num_clusters_rate=0.1,
    # NOTE(review): the logged "lengthNecessary" looks like this fraction of
    # the per-ISBN record count -- confirm in the project code.
    block_length_thresold=0.2,
)

In [3]:
# Load the dataset selected by key_values['dataset']. The four returned
# values are unpacked in the order load_dataset yields them.
# NOTE(review): presumably records are grouped per ISBN with the ground-truth
# authors alongside -- confirm against preprocessing_datasets.load_dataset.
(
    dataset_name,
    table_group_by_isbn,
    isbn_list,
    true_authors,
) = load_dataset(key_values)

dataset: clean_book
Loading time is: 2.3436758518218994


In [4]:
# Set up the embedding model described by key_values (model_type,
# model_version, rnn_dim, char_level are echoed in the output below).
# This is the slow step of the notebook: the recorded run reports a setup
# time of about 205 seconds.
set_embedding_model(key_values)

Vocab size : 2196017
model_version: 2
rnn_dim: 1024
model_type: bilstm
char_level: False
Setup time is: 205.4702537059784


In [5]:
# Run the fusion pipeline without dimensionality reduction and report the
# wall-clock time of the whole run. With the current settings the helper
# prints a log block for each ISBN (embedding, blocking, candidates).
# NOTE(review): finalAuthors / trueAuthors are presumably the fused and the
# ground-truth author lists -- confirm against helper.py.
start_time = time.time()
finalAuthors, trueAuthors = launchWithoutReductionFusion(
    table_group_by_isbn,
    isbn_list,
    true_authors,
    key_values,
)
print("Total time is: {0}".format(time.time() - start_time))

ISBN: 0007197160
true author: Marren Peter
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 1.013118028640747
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.1833782196044922
Discarted candidate: [{'conservation officer': 2, 'former scientist': 2}, {'marren naturalist peter': 2}]
Possible candidate: [{'marren peter': 19}]
lengthNecessary: 5.0
[{'marren peter': 19}]
['marren peter'] VS true_author: ['marren peter']
ISBN: 0029011086
true author: Averill James R.,Nunley Elma P.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08344602584838867
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0017910003662109375
Discarted candidate: [{'elma nunley p': 4}, {'averill': 1, 'james r': 1}]
Possible candidate: [{'averill james r': 21}]
lengthNecessary: 5.4
[{'averill james r': 21}]
['averill james r'] VS

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11447477340698242
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005087852478027344
Discarted candidate: [{'george witte': 1, 'glenn': 3}, {'van zutphen': 3}, {'schmitt': 3}, {'bernd': 3}]
Possible candidate: [{'bernd schmitt': 25}, {'glenn van zutphen': 19}]
lengthNecessary: 11.4
[{'bernd schmitt': 25}, {'glenn van zutphen': 19}]
['bernd schmitt', 'glenn van zutphen'] VS true_author: ['bernd schmitt', 'glenn van zutphen']
ISBN: 0241113873
true author: Critchley Julian
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.049327850341796875
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0021390914916992188
Discarted candidate: [{'colin wheeler': 1}]
Possible candidate: [{'critchley': 1, 'critchley julian': 17}]
lengthNecessary: 3.8000000000000003

Blocking time is: 0.0017881393432617188
Discarted candidate: [{'maurice thompson': 1}]
Possible candidate: [{'moritz thomsen': 16}]
lengthNecessary: 3.4000000000000004
[{'moritz thomsen': 16}]
['moritz thomsen'] VS true_author: ['moritz thomsen']
ISBN: 0439436559
true author: Nix Garth
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08751487731933594
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.004102230072021484
Discarted candidate: [{'garth nix': 2}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}]
Possible candidate: [{'garth nix': 45}]
lengthNecessary: 10.200000000000001
[{'garth nix': 45}]
['garth nix'] VS true_author: ['garth nix']
ISBN: 0439670195
true author: Kerr P. B.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2638280391693115
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUST

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.30017709732055664
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.012361288070678711
Discarted candidate: [{'donald katz': 18}, {'adult viking': 1}, {'adult viking': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}]
Possible candidate: [{'donald katz r': 76}]
lengthNecessary: 20.400000000000002
[{'donald katz r': 76}]
['donald katz r'] VS true_author: ['donald katz r']
ISBN: 0671640984
true author: Turnbull Colin M.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11473894119262695
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005485057830810547
Discarted candidate: [{'colin turnbull': 7}, {'turnbull': 2}, {'colin m turnbull': 1}, {'colin m turnbull': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10061907768249512
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002640962600708008
Discarted candidate: [{'beattie william': 5}, {'beatty dr william': 1}, {'beattie w': 1}]
Possible candidate: [{'a m ross': 1, 'alexander m ross': 22, 'alexander ross': 1}]
lengthNecessary: 6.2
[{'a m ross': 1, 'alexander m ross': 22, 'alexander ross': 1}]
['alexander m ross'] VS true_author: ['alexander m ross']
ISBN: 0802115462
true author: Weddle David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.059667348861694336
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001646280288696289
Discarted candidate: [{'american heritage': 1}]
Possible candidate: [{'david peckinpah re sam weddle': 1, 'david weddle': 16}]
lengthNecessary: 3.6
[{'david peckinpah re sam w

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07565808296203613
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0024139881134033203
Discarted candidate: [{'johnston ollie': 1}]
Possible candidate: [{'johnston ollie': 18}, {'frank thomas': 9}]
lengthNecessary: 5.6000000000000005
[{'johnston ollie': 18}, {'frank thomas': 9}]
['johnston ollie', 'frank thomas'] VS true_author: ['johnston ollie', 'frank thomas']
ISBN: 159558191X
true author: Moby,Park Miyun
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09482407569885254
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0036001205444335938
Discarted candidate: [{'miyun park': 7}, {'moby park': 2}, {'and miyun park': 1}, {'moby': 1}]
Possible candidate: [{'moby': 35}]
lengthNecessary: 9.200000000000001
[{'moby': 35}]
['moby'] VS true_author: ['

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.31500697135925293
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014396905899047852
Discarted candidate: [{'doug welsch': 6}, {'doug welsh': 2, 'douglas welsh': 1, 'doyg welsh': 1, 'welsh': 2}, {'connie effefson': 1, 'connie ellefson': 3, 'connie ellefson l': 1, 'connie ellefson loc': 1}, {'lockhart thomas': 1, 'steph thomas': 1, 'stephens tom': 3}, {'ellefson stephens': 2, 'stephens': 1, 'stephens tho': 1}, {'l': 1}, {'dough welsh': 1}]
Possible candidate: [{'connie ellefson lockhart': 28, 'connie lockhart': 1}, {'l stephens thomas': 25}, {'douglas ellefson f welsh': 1, 'douglas f welsh': 23}]
lengthNecessary: 21.400000000000002
[{'connie ellefson lockhart': 28, 'connie lockhart': 1}, {'l stephens thomas': 25}, {'douglas ellefson f welsh': 1, 'douglas f welsh': 23}]
['connie ellefson lockhart', 'l stephens thomas', 'douglas f welsh'] VS 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2825767993927002
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.00667881965637207
Discarted candidate: [{'alec guiness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}]
Possible candidate: [{'alec guinness': 58}]
lengthNecessary: 12.8
[{'alec guinness': 58}]
['alec guinness'] VS true_author: ['alec guinness']
ISBN: 029777283X
true author: Richards J. M.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04851508140563965
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0011379718780517578
Discarted candidate: []
Possible candidate: [{'j m richards': 5, 'j richards': 1, 'james maude richards': 1, 'm': 1}]
lengthNecessary: 1.6
[{'j m richards': 5, 'j richards': 1, 'james maude richa

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3331730365753174
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.012552976608276367
Discarted candidate: [{'beaton c m': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}]
Possible candidate: [{'ann beattie': 56}]
lengthNecessary: 12.4
[{'ann beattie': 56}]
['ann beattie'] VS true_author: ['ann beattie']
ISBN: 0395138841
true author: Farris Martin T.,Sampson Roy J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0858008861541748
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0012972354888916016
Discarted candidate: []
Possible candidate: [{'farris m y': 1, 'farris martin t': 4, 'j r simpson': 1, 'j roy sampson': 1}]
lengthNecessary: 1.4000000000000001
[{'farris m y': 1, 'farris martin t': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06491708755493164
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.004522085189819336
Discarted candidate: [{'konstantin papagiannaki': 1}, {'konstantina papagiannaki': 1}, {'konstantina papagiannaki': 1}, {'konstantina papagiannaki': 1}]
Possible candidate: [{'antonio nucci': 33}, {'konstantina papagiannaki': 16, 'nucci': 4}]
lengthNecessary: 11.4
[{'antonio nucci': 33}, {'konstantina papagiannaki': 16, 'nucci': 4}]
['antonio nucci', 'konstantina papagiannaki'] VS true_author: ['antonio nucci', 'konstantina papagiannaki']
ISBN: 0571109020
true author: Christie A. B.,Christie Mary C.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0446619987487793
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0007491111755371094
Discarted candidate: []
Possi

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07899904251098633
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.003237009048461914
Discarted candidate: [{'george ulrich': 4}, {'jan karon': 1}, {'jan karon': 1}]
Possible candidate: [{'jan karon': 34}]
lengthNecessary: 8.0
[{'jan karon': 34}]
['jan karon'] VS true_author: ['jan karon']
ISBN: 0765366665
true author: Wiehl Lis,Henry April
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0691690444946289
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0031270980834960938
Discarted candidate: [{'april henry': 1}, {'lis wiehl': 1}, {'april henry': 1}]
Possible candidate: [{'lis wiehl': 24}, {'april henry': 19}]
lengthNecessary: 9.200000000000001
[{'lis wiehl': 24}, {'april henry': 19}]
['lis wiehl', 'april henry'] VS true_author: ['lis wiehl', '

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11415815353393555
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.00544285774230957
Discarted candidate: [{'assis tov': 1}, {'yom': 1}, {'folberg': 1}, {'folberg neil photography': 1}]
Possible candidate: [{'folberg neil': 26, 'neil': 1}, {'assis tov yom': 24}]
lengthNecessary: 11.0
[{'folberg neil': 26, 'neil': 1}, {'assis tov yom': 24}]
['folberg neil', 'assis tov yom'] VS true_author: ['folberg neil']
ISBN: 0908228082
true author: Mollison Bill,Slay Reny Mia
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05091094970703125
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001177072525024414
Discarted candidate: [{'mia reny slay': 2}]
Possible candidate: [{'bill mollison': 11}]
lengthNecessary: 2.6
[{'bill mollison': 11}]
['bill mollison'] VS

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2911972999572754
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.010025978088378906
Discarted candidate: [{'kaplan robert steven': 4}, {'davenport h thomas': 3}, {'kaplan rs': 3}, {'dp norton': 3}, {'david norton p': 1}, {'david norton p': 1}, {'david norton p': 1}, {'david norton p': 1}]
Possible candidate: [{'kaplan robert s': 41}, {'david norton p': 34}]
lengthNecessary: 18.400000000000002
[{'kaplan robert s': 41}, {'david norton p': 34}]
['kaplan robert s', 'david norton p'] VS true_author: ['kaplan robert s', 'david norton p']
ISBN: 1851774882
true author: Ajmar-Wollheim Marta,Dennis Flora
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04262399673461914
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001486063003540039
Discarted candid

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04692196846008301
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0020542144775390625
Discarted candidate: []
Possible candidate: [{'e frank r': 4, 'e frank ronald': 1, 'g greenberg m': 2}]
lengthNecessary: 1.4000000000000001
[{'e frank r': 4, 'e frank ronald': 1, 'g greenberg m': 2}]
['e frank r'] VS true_author: ['e frank ronald', 'g greenberg marshall']
ISBN: 0904230112
true author: Mondey David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05835413932800293
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0032062530517578125
Discarted candidate: [{'ross stanley': 6}, {'david mondey': 2}, {'david money': 1}]
Possible candidate: [{'david mondey': 25}]
lengthNecessary: 6.800000000000001
[{'david mondey': 25}]
['david mondey'] VS true_author

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06484723091125488
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.00251007080078125
Discarted candidate: [{'clooney george': 1}, {'hudson jeff': 1}, {'hudson jeff': 1}]
Possible candidate: [{'hudson jeff': 30}]
lengthNecessary: 6.6000000000000005
[{'hudson jeff': 30}]
['hudson jeff'] VS true_author: ['hudson jeff']
ISBN: 0002007908
true author: Heath Joseph,Potter Andrew
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.060805320739746094
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0019316673278808594
Discarted candidate: [{'unnamed': 1}]
Possible candidate: [{'heath joseph': 13, 'joseph': 1}, {'andrew heath potter': 1, 'andrew potter': 13}]
lengthNecessary: 5.800000000000001
[{'heath joseph': 13, 'joseph': 1}, {'andrew heath potter': 1, 'a

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10857987403869629
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0019259452819824219
Discarted candidate: [{'belash phillips rachel trans': 1, 'inth mexico of other solitude the': 1, 'milos yara': 1, 'return to': 1}, {'kemp lysander': 3}]
Possible candidate: [{'octavio paz': 19}]
lengthNecessary: 5.2
[{'octavio paz': 19}]
['octavio paz'] VS true_author: ['octavio paz']
ISBN: 0895265222
true author: Meese Edwin III
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.039392948150634766
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0006358623504638672
Discarted candidate: []
Possible candidate: [{'edwin iii meese': 1, 'edwin meese': 1}]
lengthNecessary: 0.4
[{'edwin iii meese': 1, 'edwin meese': 1}]
['edwin iii meese'] VS true_author: ['edwin iii

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06308269500732422
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0016880035400390625
Discarted candidate: [{'business of': 1}, {'business of the': 1}]
Possible candidate: [{'adam horowitz': 19}]
lengthNecessary: 4.2
[{'adam horowitz': 19}]
['adam horowitz'] VS true_author: ['adam horowitz']
ISBN: 0316104671
true author: Boyle T. Coraghessan
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.03424525260925293
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0008919239044189453
Discarted candidate: []
Possible candidate: [{'boyle c t': 1, 'boyle coraghessan t': 1}]
lengthNecessary: 0.4
[{'boyle c t': 1, 'boyle coraghessan t': 1}]
['boyle c t'] VS true_author: ['boyle coraghessan t']
ISBN: 0273642383
true author: Kolk Ans
embedding_type: inferSent


embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05708718299865723
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0017819404602050781
Discarted candidate: [{'albert diianni': 1}]
Possible candidate: [{'a griffin james': 16}]
lengthNecessary: 3.4000000000000004
[{'a griffin james': 16}]
['a griffin james'] VS true_author: ['a griffin james']
ISBN: 0855616881
true author: Solomon Charmaine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04642510414123535
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0014460086822509766
Discarted candidate: []
Possible candidate: [{'charmaine solomon': 4, 'nina solomon': 2}]
lengthNecessary: 1.2000000000000002
[{'charmaine solomon': 4, 'nina solomon': 2}]
['charmaine solomon'] VS true_author: ['charmaine solomon']
ISBN: 0399117962
true author: Robinson Spid

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09602212905883789
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.003798961639404297
Discarted candidate: [{'betina krahn m': 8}, {'betina krahn m': 1}, {'betina krahn': 1}, {'betina krahn': 1}, {'betina krahn': 1}]
Possible candidate: [{'betina krahn': 40}]
lengthNecessary: 10.4
[{'betina krahn': 40}]
['betina krahn'] VS true_author: ['betina krahn']
ISBN: 1555424155
true author: Desatnick Robert L.,Detzel Denis H.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08187413215637207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.00261688232421875
Discarted candidate: [{'desatnick l robert': 1}, {'denis detzel h': 1}]
Possible candidate: [{'desanick l robert': 1, 'desatnick l robert': 18}, {'denis detzel h': 12}]
lengthNecessary: 6.600000000000

Blocking time is: 0.010216236114501953
Discarted candidate: [{'eugene price': 1}, {'eugenia price': 1}, {'eugenia price': 1}, {'eugenia price': 1}, {'eugenia price': 1}, {'eugenia price': 1}]
Possible candidate: [{'eugenia price': 58}]
lengthNecessary: 12.8
[{'eugenia price': 58}]
['eugenia price'] VS true_author: ['eugenia price']
ISBN: 0898158621
true author: Miller Mark,MacLauchlan Andrew,Harrisson John
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13423895835876465
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0032651424407958984
Discarted candidate: [{'charles mark miller': 2}, {'harrisson john': 2}, {'mark mi': 1}]
Possible candidate: [{'mark miller': 20}, {'andrew maclauchian': 1, 'andrew maclauchlan': 19}]
lengthNecessary: 9.0
[{'mark miller': 20}, {'andrew maclauchian': 1, 'andrew maclauchlan': 19}]
['mark miller', 'andrew maclauchlan'] VS true_author: ['mark miller', 'andre

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.076904296875
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001984119415283203
Discarted candidate: []
Possible candidate: [{'conn dr george h': 3, 'conn george': 1, 'conn george h': 1, 'conn george harold': 8, 'george h': 1}, {'conn': 1, 'elsie v': 1, 'h': 1, 'hanauer': 1, 'horse library lovers wilshire': 1}]
lengthNecessary: 3.8000000000000003
[{'conn dr george h': 3, 'conn george': 1, 'conn george h': 1, 'conn george harold': 8, 'george h': 1}, {'conn': 1, 'elsie v': 1, 'h': 1, 'hanauer': 1, 'horse library lovers wilshire': 1}]
['conn george harold', 'conn'] VS true_author: ['conn george h']
ISBN: 0385293917
true author: Olsen Jack
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.03978610038757324
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08635902404785156
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002485990524291992
Discarted candidate: [{'alvin kerr': 1, 'federico helen': 1}, {'arie dezanger': 1, 'townsend': 1}]
Possible candidate: [{'adams': 1, 'adams charlotte': 19}, {'doris m townsend': 1, 'doris mcferran townsend': 8}]
lengthNecessary: 6.6000000000000005
[{'adams': 1, 'adams charlotte': 19}, {'doris m townsend': 1, 'doris mcferran townsend': 8}]
['adams charlotte', 'doris mcferran townsend'] VS true_author: ['adams charlotte', 'doris mcferran townsend']
ISBN: 0380018136
true author: Asimov Isaac
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05599474906921387
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0019469261169433594
Discarted candidate: [{'asimov isaac': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2921299934387207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017879009246826172
Discarted candidate: [{'chaucher': 1, 'coghill nevill': 9}, {'chaucer': 1, 'chaucer geofrey': 1}, {'coghill nevil': 1}, {'coghill nevill': 1}, {'coghill nevill': 1}, {'coghill nevill': 1}, {'coghill nevill': 1}, {'coghill nevil trans': 1}, {'h liddell mark': 1}]
Possible candidate: [{'chaucer geoffrey': 103}]
lengthNecessary: 24.400000000000002
[{'chaucer geoffrey': 103}]
['chaucer geoffrey'] VS true_author: ['chaucer geoffrey']
ISBN: 0072859342
true author: Getlein Mark
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05601215362548828
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0026030540466308594
Discarted candidate: [{'gilbert rita': 1}, {'getlein mark

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18359994888305664
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.016035079956054688
Discarted candidate: [{'llywelyn': 1}, {'scott': 1}, {'llywelyn morgan': 1}, {'llywelyn morgan': 1}, {'llywelyn morgan': 1}, {'llywelyn morgan': 1}, {'llywelyn morgan': 1}, {'llywelyn morgan': 1}]
Possible candidate: [{'michael scott': 54}, {'llywelyn morgan': 50}]
lengthNecessary: 22.400000000000002
[{'michael scott': 54}, {'llywelyn morgan': 50}]
['michael scott', 'llywelyn morgan'] VS true_author: ['llywelyn morgan', 'michael scott']
ISBN: 0801040264
true author: Hendriksen William
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04207611083984375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015549659729003906
Discarted candidate: []
Possible candidate

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09351801872253418
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0021109580993652344
Discarted candidate: [{'a': 1, 'administration space': 1, 'm': 1}]
Possible candidate: [{'aeronautics national s u': 1, 'd launius roger': 10, 'j lear linda': 1}, {'a day dwayne': 9, 'day dwayne': 1}, {'john logsdon': 1, 'john logsdon m': 8}]
lengthNecessary: 6.800000000000001
[{'aeronautics national s u': 1, 'd launius roger': 10, 'j lear linda': 1}, {'a day dwayne': 9, 'day dwayne': 1}, {'john logsdon': 1, 'john logsdon m': 8}]
['d launius roger', 'a day dwayne', 'john logsdon m'] VS true_author: ['john logsdon m', 'a day dwayne', 'd launius roger']
ISBN: 086554915X
true author: Hunt James L.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.054705142974853516
cluster_method: hierarchy
num_clu

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.43744492530822754
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.04180717468261719
Discarted candidate: [{'nixon richard': 2}, {'nixon richard': 1}, {'nixon richard': 1}, {'nixon richard': 1}, {'nixon richard': 1}, {'nixon richard': 1}, {'nixon richard': 1}, {'nixon richard': 1}]
Possible candidate: [{'milhous nixon richard': 8, 'nixon richard': 125}, {'m nixon richard': 44}]
lengthNecessary: 37.2
[{'milhous nixon richard': 8, 'nixon richard': 125}, {'m nixon richard': 44}]
['nixon richard', 'm nixon richard'] VS true_author: ['nixon richard']
ISBN: 0070378150
true author: Lieberman Ernest D.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05453610420227051
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001306295394897461
Discarted candida

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3352200984954834
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011073827743530273
Discarted candidate: [{'barber e': 1}, {'barber elizabeth w': 1}, {'barber e j': 1}, {'barber elizabeth wayland': 1}, {'barber elizabeth wayland': 1}, {'barber elizabeth wayland': 1}, {'barber elizabeth wayland': 1}]
Possible candidate: [{'barber elizabeth wayland': 51}, {'barber e j w': 27}]
lengthNecessary: 17.0
[{'barber elizabeth wayland': 51}, {'barber e j w': 27}]
['barber elizabeth wayland', 'barber e j w'] VS true_author: ['barber elizabeth wayland']
ISBN: 0370013476
true author: Taylor E. G. R.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06210803985595703
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0010988712310791016
Discarted candidate: []
P

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05386996269226074
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0014488697052001953
Discarted candidate: [{'seymour': 1}]
Possible candidate: [{'ana seymour': 13}]
lengthNecessary: 2.8000000000000003
[{'ana seymour': 13}]
['ana seymour'] VS true_author: ['ana seymour']
ISBN: 1922147249
true author: Learmonth Eleanor,Tabakoff Jenny
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07295799255371094
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.003070831298828125
Discarted candidate: [{'eleanor learmonth': 1}, {'jenny tabakoff': 1}]
Possible candidate: [{'eleanor learmonth': 24}, {'jenny tabakoff': 14}]
lengthNecessary: 8.0
[{'eleanor learmonth': 24}, {'jenny tabakoff': 14}]
['eleanor learmonth', 'jenny tabakoff'] VS true_author: ['eleanor le

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1960139274597168
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.016211986541748047
Discarted candidate: [{'irving jim': 7}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}, {'irving john': 1}]
Possible candidate: [{'irving john': 98}]
lengthNecessary: 22.6
[{'irving john': 98}]
['irving john'] VS true_author: ['irving john']
ISBN: 0962782548
true author: Fisher Donna,Vilas Sandy
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07899594306945801
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002360105514526367
Discarted candidate: [{'conna vilas': 1, 'donna vilas': 1}, {'sandy': 1}]
Possible candidate: [{'sandy vilas': 24}, {'donna fisher': 7}]
lengthN

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05258917808532715
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0034821033477783203
Discarted candidate: [{'chant chris': 1}]
Possible candidate: [{'chant christopher': 11}, {'chant chris': 9}]
lengthNecessary: 4.2
[{'chant christopher': 11}, {'chant chris': 9}]
['chant christopher', 'chant chris'] VS true_author: ['chant chris']
ISBN: 0262081601
true author: Holland John H.,Holyoak Keith J.,Nisbett Richard E.,Thagard Paul R.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05715489387512207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0014350414276123047
Discarted candidate: []
Possible candidate: [{'aa vv': 1, 'e nisbet richard': 1, 'e nisbett richard': 1, 'holyoak j keith': 1, 'paul r thaga': 1, 'paul r thagard': 1, 'paul thagard': 1},

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06017804145812988
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.003139019012451172
Discarted candidate: [{'lev raphael': 2}, {'lee raphael': 1}]
Possible candidate: [{'lev raphael': 20}]
lengthNecessary: 4.6000000000000005
[{'lev raphael': 20}]
['lev raphael'] VS true_author: ['lev raphael']
ISBN: 019925933X
true author: New Steve,Westbrook Roy
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05479598045349121
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001207113265991211
Discarted candidate: []
Possible candidate: [{'j new steve': 1, 'new steve': 7, 'oxford press university': 1}, {'roy westbrook': 4}]
lengthNecessary: 2.6
[{'j new steve': 1, 'new steve': 7, 'oxford press university': 1}, {'roy westbrook': 4}]
['new steve', 'roy westbroo

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12483000755310059
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0026040077209472656
Discarted candidate: [{'corrigan g grace': 2}, {'corrigan geor grace': 1}, {'corrigan grace': 1}]
Possible candidate: [{'corrigan george grace': 31}]
lengthNecessary: 7.0
[{'corrigan george grace': 31}]
['corrigan george grace'] VS true_author: ['corrigan george grace']
ISBN: 0884042855
true author: Hubbard L. Ron
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10009312629699707
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002892017364501953
Discarted candidate: [{'hubbard r ron': 6}, {'hubbard l ron': 1}, {'hubbard l ron': 1}]
Possible candidate: [{'hubbard l ron': 32}]
lengthNecessary: 8.0
[{'hubbard l ron': 32}]
['hubbard l ron'] VS true_author: ['hubb

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06130790710449219
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0016939640045166016
Discarted candidate: []
Possible candidate: [{'grieve maud': 15}, {'grieve kr?uter m naturheilkunde': 1, 'grieve m': 4}]
lengthNecessary: 4.0
[{'grieve maud': 15}, {'grieve kr?uter m naturheilkunde': 1, 'grieve m': 4}]
['grieve maud', 'grieve m'] VS true_author: ['grieve m']
ISBN: 0869202057
true author: Jack Alex D.,Cobban D. G.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.042815208435058594
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.001992940902709961
Discarted candidate: []
Possible candidate: [{'alex d jack': 5, 'cobban d g': 2, 'h s williams': 1}]
lengthNecessary: 1.6
[{'alex d jack': 5, 'cobban d g': 2, 'h s williams': 1}]
['alex d jack'] VS tr

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09950017929077148
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002415895462036133
Discarted candidate: [{'b d jacobs m michael': 2}, {'jacobs michael': 1}, {'d m': 1}]
Possible candidate: [{'b jacobs michael': 27}]
lengthNecessary: 6.2
[{'b jacobs michael': 27}]
['b jacobs michael'] VS true_author: ['b jacobs michael']
ISBN: 2226005773
true author: Sabatier Robert
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05927014350891113
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0015702247619628906
Discarted candidate: [{'robert sabatier': 2}, {'sabatier': 1}]
Possible candidate: [{'robert sabatier': 20}]
lengthNecessary: 4.6000000000000005
[{'robert sabatier': 20}]
['robert sabatier'] VS true_author: ['robert sabatier']
ISBN: 0674073010
true

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2939610481262207
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03116583824157715
Discarted candidate: [{'margaret peden sayers': 20}, {'from margaret peden sayers spanish the': 1}, {'margaret peden sayers trans': 1}, {'allende isabel': 1}, {'allende isabel': 1}, {'allende isabel': 1}, {'allende isabel': 1}, {'allende isabel': 1}, {'allende isabel': 1}]
Possible candidate: [{'allende isabel': 120}]
lengthNecessary: 29.6
[{'allende isabel': 120}]
['allende isabel'] VS true_author: ['allende isabel']
ISBN: 0060171324
true author: Erdrich Louise
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1332240104675293
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.0068149566650390625
Discarted candidate: [{'erdrich louise': 4}, {'erdrich louise': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18155980110168457
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009169340133666992
Discarted candidate: [{'bloom harold': 11}, {'bloom harold interpretation': 1}, {'an bloom harold interpretation': 1}, {'meyer': 1}, {'notes': 1}, {'marvin meyer w': 1}, {'marvin meyer w': 1}]
Possible candidate: [{'marvin meyer w': 45}, {'marvin meyer': 22}]
lengthNecessary: 16.8
[{'marvin meyer w': 45}, {'marvin meyer': 22}]
['marvin meyer w', 'marvin meyer'] VS true_author: ['marvin meyer']
ISBN: 0060731583
true author: Franks Tommy,McConnell Malcolm
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3742790222167969
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.05502200126647949
Discarted candidate: [{'franks r tommy': 26}, {'central': 1, 'in': 1, 'r': 1}

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3422880172729492
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.05031228065490723
Discarted candidate: [{'defelice ji': 1}, {'mcewen scott': 1}, {'mcewen scott': 1}, {'mcewen scott': 1}, {'mcewen scott': 1}, {'mcewen scott': 1}, {'mcewen scott': 1}]
Possible candidate: [{'chris kyle': 81}, {'defelice jim': 66}, {'mcewen scott': 60}]
lengthNecessary: 42.800000000000004
[{'chris kyle': 81}, {'defelice jim': 66}, {'mcewen scott': 60}]
['chris kyle', 'defelice jim', 'mcewen scott'] VS true_author: ['chris kyle', 'mcewen scott', 'defelice jim']
ISBN: 0062701789
true author: Woods Earl,McDaniel Pete,Woods Tiger
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20850300788879395
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014307975769042969
Dis

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3145792484283447
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.04250335693359375
Discarted candidate: [{'bull george': 21}, {'an bull castiglione george': 2}, {'baldesar': 2}, {'an bull george': 2}, {'bull castiglione': 2}, {'baldesar castiglione': 1}, {'baldesar castiglione': 1}, {'baldesar castiglione': 1}, {'baldesar castiglione': 1}]
Possible candidate: [{'baldassare castiglione': 13, 'baldassarre castiglione': 4, 'baldesa castiglione': 2, 'baldesar castiglione': 130}]
lengthNecessary: 36.4
[{'baldassare castiglione': 13, 'baldassarre castiglione': 4, 'baldesa castiglione': 2, 'baldesar castiglione': 130}]
['baldesar castiglione'] VS true_author: ['baldesar castiglione']
ISBN: 0140445927
true author: Homer 
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2019760608673095

Blocking time is: 0.012820005416870117
Discarted candidate: [{'faber michael': 10}, {'faber m': 1}, {'faber michel': 1}, {'faber michel': 1}, {'faber michel': 1}, {'faber michel': 1}, {'faber michel': 1}, {'faber michel': 1}, {'faber michel': 1}]
Possible candidate: [{'faber michel': 86}]
lengthNecessary: 20.8
[{'faber michel': 86}]
['faber michel'] VS true_author: ['faber michel']
ISBN: 0156031442
true author: Grandin Temple,Johnson Catherine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3769400119781494
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0457911491394043
Discarted candidate: [{'speaker': 2}, {'collectif': 1}, {'grandin t': 1}, {'joh': 1}, {'d dr ph': 1}, {'grandin': 1}, {'d grandin ph temple': 1}, {'d grandin ph temple': 1}]
Possible candidate: [{'grandin temple': 103}, {'catherine johnson': 91}]
lengthNecessary: 40.6
[{'grandin temple': 103}, {'catherine johnson': 91}]

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5200250148773193
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.04025411605834961
Discarted candidate: [{'howard means': 2}, {'howard means': 2}, {'currie elliott': 1}, {'currie elliott': 1}, {'freeh j louis': 1}, {'freeh j louis': 1}, {'freeh j louis': 1}, {'freeh j louis': 1}, {'freeh j louis': 1}]
Possible candidate: [{'freeh j louis': 180}]
lengthNecessary: 38.2
[{'freeh j louis': 180}]
['freeh j louis'] VS true_author: ['freeh j louis']
ISBN: 0312567480
true author: Cast C. P.,Cast Kristin
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.4256300926208496
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.05445218086242676
Discarted candidate: [{'cast krist': 1}, {'kristin': 1}, {'kristin': 1}, {'kristin': 1}, {'c cast p': 1}, {'c cast p':

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1527881622314453
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011867761611938477
Discarted candidate: [{'david sedaris': 2}, {'d sedaris': 1}, {'david sedaris': 1}, {'david sedaris': 1}, {'david sedaris': 1}, {'david sedaris': 1}, {'david sedaris': 1}, {'david sedaris': 1}]
Possible candidate: [{'david sedaris': 81}]
lengthNecessary: 18.0
[{'david sedaris': 81}]
['david sedaris'] VS true_author: ['david sedaris']
ISBN: 0340696761
true author: Milton Giles
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.27251672744750977
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03466391563415527
Discarted candidate: [{'greg milton': 2}, {'mi': 1}, {'mi': 1}, {'giles milton': 1}, {'giles milton': 1}, {'giles milton': 1}, {'giles milton': 1}, {'giles 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17640089988708496
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01138615608215332
Discarted candidate: [{'gary gianni': 9}, {'chabon michael': 1}, {'gary gianni': 1}, {'chabon michael': 1}, {'gary gianni': 1}, {'chabon michael': 1}, {'chabon michael': 1}, {'chabon michael': 1}, {'chabon michael': 1}]
Possible candidate: [{'chabon michael': 79}]
lengthNecessary: 19.200000000000003
[{'chabon michael': 79}]
['chabon michael'] VS true_author: ['chabon michael']
ISBN: 0345803485
true author: James L E
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19132494926452637
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008642196655273438
Discarted candidate: [{'fifty gray of shades': 1}, {'el james': 1}, {'e james l': 1}, {'e el james l': 1}, {'e jam

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2918281555175781
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01797795295715332
Discarted candidate: [{'al design dj nagy': 2}, {'christensen dave dj ration': 2}, {'king stephen': 1}, {'king stephen': 1}, {'king stephen': 1}, {'king stephen': 1}, {'king stephen': 1}, {'king stephen': 1}, {'king stephen': 1}]
Possible candidate: [{'king stephen': 110}]
lengthNecessary: 24.200000000000003
[{'king stephen': 110}]
['king stephen'] VS true_author: ['king stephen']
ISBN: 0385232497
true author: Plimpton George
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.21166205406188965
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009480953216552734
Discarted candidate: [{'a george plimpton': 1}, {'w': 1}, {'jr': 1}, {'aldrich nelson': 1}, {'george plim

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2207038402557373
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.016345977783203125
Discarted candidate: [{'jr mosley walter': 2}, {'mosley w': 1}, {'jr mosley walter': 1}, {'jr mosley walter': 1}, {'jr mosley walter': 1}, {'jr mosley walter': 1}, {'jr mosley walter': 1}, {'brent glass': 1}, {'jr mosley walter': 1}]
Possible candidate: [{'mosley walter': 98}]
lengthNecessary: 21.6
[{'mosley walter': 98}]
['mosley walter'] VS true_author: ['mosley walter']
ISBN: 0393034267
true author: Knox Bernard
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1253340244293213
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.0046062469482421875
Discarted candidate: [{'bernard knox macgregor walker': 10}, {'b knox': 2, 'knox': 1}, {'bernard knox m w': 3}, {'b

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2795288562774658
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009074926376342773
Discarted candidate: [{'hogan randolph': 6}, {'gabriel garc?a m?rquez': 3, 'gabriel garc?a mrquez': 1}, {'garbriel garcia marquez': 1, 'garcia marquez': 1}, {'edith grossman': 1}, {'***nobel author gabriel prize-winning': 1}, {'gabriel garc?a m?rquez': 1}, {'gabriel garcia-marquez': 1}, {'gabriel garc?a m?rquez': 1}]
Possible candidate: [{'gabriel garcia marquez': 71}]
lengthNecessary: 17.6
[{'gabriel garcia marquez': 71}]
['gabriel garcia marquez'] VS true_author: ['gabriel garcia marquez']
ISBN: 0394551540
true author: Michener A. James
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24099993705749512
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01898288

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2803840637207031
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.00787496566772461
Discarted candidate: [{'gannet ruth stiles': 1}, {'chrisman gannett ruth': 1}, {'chrisman gannett ruth': 1}, {'gannett ruth stiles': 1}, {'gannett ruth stiles': 1}, {'gannett ruth stiles': 1}, {'gannett ruth stiles': 1}]
Possible candidate: [{'gannett ruth stiles': 66}]
lengthNecessary: 14.600000000000001
[{'gannett ruth stiles': 66}]
['gannett ruth stiles'] VS true_author: ['gannett ruth stiles']
ISBN: 0395305098
true author: Galbraith Kenneth John
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23101472854614258
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014500856399536133
Discarted candidate: [{'galbraith john kenneth': 2}, {'galbraith john k': 1}, {'g

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2403700351715088
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02379918098449707
Discarted candidate: [{'d koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}, {'dean koontz': 1}]
Possible candidate: [{'dean koontz': 69}, {'dean koontz r': 34}]
lengthNecessary: 22.200000000000003
[{'dean koontz': 69}, {'dean koontz r': 34}]
['dean koontz', 'dean koontz r'] VS true_author: ['dean koontz']
ISBN: 0399139869
true author: Gibbons Kaye
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3462038040161133
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02651214599609375
Discarted candidate: [{'gibbons kaye': 2}, {'gibbons kate': 1}, {'gibbons kaye': 1}, {'gibbons kaye': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2706410884857178
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.023176193237304688
Discarted candidate: [{'grandpr mary': 7, 'grandpre mary': 5}, {'k': 1}, {'grandpr jacket mary': 1}, {'j rowling': 1}, {'art': 1}, {'danielle steel': 1}, {'j k rowling': 1}, {'j k rowling': 1}, {'j k rowling': 1}]
Possible candidate: [{'j k rowling': 120}]
lengthNecessary: 28.0
[{'j k rowling': 120}]
['j k rowling'] VS true_author: ['j k rowling']
ISBN: 0439784549
true author: Rowling K. J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5273218154907227
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.08574295043945312
Discarted candidate: [{'grandpr mary': 14, 'grandpre mary': 5}, {'grandpre illus mary': 2}, {'illus': 2}, {'j k rowlings': 1}, {'j k rowling'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23534512519836426
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.00839090347290039
Discarted candidate: [{'ladin': 1}, {'bin carmen laden': 1}, {'marshall ruth': 1}, {'marshall ruth': 1}, {'marshall ruth': 1}, {'bin carmen ladin': 1}, {'bin carmen ladin': 1}]
Possible candidate: [{'bin carmen ladin': 70}]
lengthNecessary: 15.4
[{'bin carmen ladin': 70}]
['bin carmen ladin'] VS true_author: ['bin carmen ladin']
ISBN: 0451222350
true author: Ward R. J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.26572704315185547
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.011938095092773438
Discarted candidate: [{'j ward': 5}, {'j r ward': 1}, {'j r ward': 1}, {'j r ward': 1}, {'j r ward': 1}, {'j r ward': 1}, {'j r ward': 1}, {'j r ward': 1}, {'j r 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2753181457519531
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008838891983032227
Discarted candidate: [{'follett ken': 2}, {'bellow saul': 1}, {'follet ken': 1}, {'follett ken': 1}, {'follett ken': 1}, {'follett ken': 1}, {'follett ken': 1}]
Possible candidate: [{'follett ken': 71}]
lengthNecessary: 15.8
[{'follett ken': 71}]
['follett ken'] VS true_author: ['follett ken']
ISBN: 0545010225
true author: Rowling K. J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.6126861572265625
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.12251496315002441
Discarted candidate: [{'grandpr mary': 20, 'grandpre mary': 3}, {'jk rowling': 3}, {'j rowling': 2}, {'grandpre j k mary rowling': 2}, {'grandpr mary': 1}, {'grandpr mary': 1}, {'grandpre mary': 1}

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20084190368652344
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.008186101913452148
Discarted candidate: [{'james pd': 1}, {'baroness d james p': 1}, {'baroness d james p': 1}, {'baroness d james p': 1}, {'baroness d james p': 1}, {'baroness d james p': 1}, {'baroness d james p': 1}]
Possible candidate: [{'d james p': 57}, {'baroness d james p': 17}]
lengthNecessary: 16.2
[{'d james p': 57}, {'baroness d james p': 17}]
['d james p', 'baroness d james p'] VS true_author: ['d james p']
ISBN: 0609600575
true author: Masson Moussaieff Jeffrey
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.15531110763549805
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.010811090469360352
Discarted candidate: [{'j masson moussaieff': 14}, {'l masson thomas': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17800593376159668
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0178987979888916
Discarted candidate: [{'mcmillan terry': 2}, {'hersey john': 1}, {'mcmillan t': 1}, {'mcmillan terry': 1}, {'mcmillan terry': 1}, {'mcmillan terry': 1}, {'mcmillan terry': 1}, {'mcmillan terry': 1}, {'mcmillan terry': 1}]
Possible candidate: [{'mcmillan terry': 116}]
lengthNecessary: 25.200000000000003
[{'mcmillan terry': 116}]
['mcmillan terry'] VS true_author: ['mcmillan terry']
ISBN: 0670844527
true author: King Stephen
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17473316192626953
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.018739938735961914
Discarted candidate: [{'king stephen': 2}, {'peter straub': 1}, {'king stephen': 1}, {'king stephen': 1}, {

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16643595695495605
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01601886749267578
Discarted candidate: [{'allison d': 1}, {'allison': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}, {'allison dorothy': 1}]
Possible candidate: [{'allison dorothy': 100}]
lengthNecessary: 21.8
[{'allison dorothy': 100}]
['allison dorothy'] VS true_author: ['allison dorothy']
ISBN: 0399152601
true author: Spurlock Morgan
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17409086227416992
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.010937929153442383
Discarted candidate: [{'morgan spurlocks': 2}, {'morgan spurlock': 2}, {'morgan spurlock': 1}, {'morgan spurlock

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19353222846984863
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02337813377380371
Discarted candidate: [{'matthiessen peter': 4}, {'becky saletan': 1}, {'epstein jason': 1}, {'frank mary': 1}, {'matthiessen peter': 1}, {'matthiessen peter': 1}, {'matthiessen peter': 1}, {'matthiessen peter': 1}, {'matthiessen peter': 1}]
Possible candidate: [{'matthiessen peter': 120}]
lengthNecessary: 26.400000000000002
[{'matthiessen peter': 120}]
['matthiessen peter'] VS true_author: ['matthiessen peter']
ISBN: 0679401342
true author: Michener A. James
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.42246413230895996
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.058953046798706055
Discarted candidate: [{'james michener': 8}, {'a james michener': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16910004615783691
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.01041102409362793
Discarted candidate: [{'edward osborne wilson': 9}, {'edward osbor wilson': 1}, {'edward osborne wilson': 1}, {'edward o wilson': 1}, {'edward o wilson': 1}, {'edward o wilson': 1}]
Possible candidate: [{'edward o wilson': 51}]
lengthNecessary: 13.0
[{'edward o wilson': 51}]
['edward o wilson'] VS true_author: ['edward o wilson']
ISBN: 0679450793
true author: Artzi-Pelossof Ben Noa
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.28533506393432617
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0269620418548584
Discarted candidate: [{'artzi-pelossof noa': 2}, {'artzi-pelossof ben': 1}, {'artzi-pelossof ben': 1}, {'artzi ben pelossof': 1}, {'artzi ben pelossof'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1154181957244873
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.005688905715942383
Discarted candidate: [{'ferris t': 1}, {'ferris timothy': 1}, {'ferris timothy': 1}, {'ferris timothy': 1}, {'ferris timothy': 1}, {'ferris timothy': 1}]
Possible candidate: [{'ferris timothy': 59}]
lengthNecessary: 13.0
[{'ferris timothy': 59}]
['ferris timothy'] VS true_author: ['ferris timothy']
ISBN: 0684852217
true author: Proulx Annie
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.25922679901123047
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01954793930053711
Discarted candidate: [{'annie e proulx': 10}, {'annie proulx': 4}, {'matthews watercolors william': 1}, {'matthews williamiam': 1}, {'proulx': 1}, {'annie proulx': 1}, {'annie proulx': 1}, {'a

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.306812047958374
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.036278724670410156
Discarted candidate: [{'nancy': 2}, {'farmer': 1}, {'farmer': 1}, {'farmer nancy': 1}, {'farmer nancy': 1}, {'farmer nancy': 1}, {'farmer nancy': 1}, {'farmer nancy': 1}, {'farmer nancy': 1}]
Possible candidate: [{'farmer nancy': 171}]
lengthNecessary: 36.2
[{'farmer nancy': 171}]
['farmer nancy'] VS true_author: ['farmer nancy']
ISBN: 0689859392
true author: Black Holly,DiTerlizzi Tony
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.23560023307800293
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.0308840274810791
Discarted candidate: [{'diterlizzi t': 1}, {'black': 1}, {'black diterlizzi holly tony': 1}, {'black holly': 1}, {'black holly': 1}, {'black di ho

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3122439384460449
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.019974946975708008
Discarted candidate: [{'joanne k rowling': 8}, {'harry potter': 2}, {'book of order phoenix the': 2}, {'rowlin': 1}, {'rowlin': 1}, {'j k rowling': 1}, {'joanne k rowling': 1}, {'joanne k rowling': 1}, {'joanne k rowling': 1}]
Possible candidate: [{'j k rowling': 115}]
lengthNecessary: 26.6
[{'j k rowling': 115}]
['j k rowling'] VS true_author: ['j k rowling']
ISBN: 0747563209
true author: Schott Ben
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20391130447387695
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.010180950164794922
Discarted candidate: [{'conceived written': 2}, {'ben designed schott': 2}, {'written': 1}, {'ben conceived designed schott': 1}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1656341552734375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015958070755004883
Discarted candidate: [{'lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}, {'john lanchester': 1}]
Possible candidate: [{'john lanchester': 103}]
lengthNecessary: 22.400000000000002
[{'john lanchester': 103}]
['john lanchester'] VS true_author: ['john lanchester']
ISBN: 0805064222
true author: Kanon Joseph
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.34067606925964355
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.053114891052246094
Discarted candidate: [{'***autographrd copy joseph kanon': 2}, {'harnett kane t': 1}, {'cha

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.22007393836975098
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.022654056549072266
Discarted candidate: [{'contributor-dean merrill': 1}, {'dean merrirll': 1}, {'burnham garacia': 1}, {'burnham garcia': 1}, {'burnham gracia': 1}, {'burnham gracia': 1}, {'burnham gracia': 1}, {'burnham gracia': 1}]
Possible candidate: [{'burnham gracia': 84}, {'dean merrill': 49}]
lengthNecessary: 28.200000000000003
[{'burnham gracia': 84}, {'dean merrill': 49}]
['burnham gracia', 'dean merrill'] VS true_author: ['burnham gracia', 'dean merrill']
ISBN: 0849911796
true author: Peretti Frank
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1832273006439209
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013999700546264648
Discarted candidate: [{'countryman ja

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.26107287406921387
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.043357133865356445
Discarted candidate: [{'champy hammer~james michael': 1, 'michael': 1}, {'champy janes': 1}, {'champy hammer james': 1}, {'hammer micheal': 1}, {'hammer james michael': 1}, {'champy': 1}, {'dr': 1}, {'hammer michael': 1}]
Possible candidate: [{'hammer michael': 69}, {'champy james': 63}]
lengthNecessary: 28.200000000000003
[{'hammer michael': 69}, {'champy james': 63}]
['hammer michael', 'champy james'] VS true_author: ['hammer michael', 'champy james']
ISBN: 089296720X
true author: Maron Margaret
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.21250700950622559
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.009747982025146484
Discarted candidate: [{'margar

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.15891194343566895
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.013842105865478516
Discarted candidate: [{'bill breen': 17}, {'g hamel': 3}, {'hamel': 3}, {'bill breen': 1}, {'bill breen': 1}, {'bill breen': 1}, {'bill breen': 1}, {'bill breen': 1}, {'bill breen': 1}]
Possible candidate: [{'gary hamel': 71}]
lengthNecessary: 20.0
[{'gary hamel': 71}]
['gary hamel'] VS true_author: ['gary hamel', 'bill breen']
ISBN: 1476729085
true author: Simsion Graeme
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12015223503112793
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008332014083862305
Discarted candidate: [{'c graeme simsion': 4}, {'graeme simsion': 1}, {'graeme simsion': 1}, {'graeme simsion': 1}, {'graeme simsion': 1}, {'graeme simsion': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3496971130371094
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.021319866180419922
Discarted candidate: [{'frieberg kevin': 2}, {'freiberg': 1}, {'freiberg jackie kevin': 1}, {'peters tom': 1}, {'freiberg jackie kevin': 1}, {'forward jackie peters tom': 1}, {'freiberg~foreword freiberg~jackie kevin peters tom': 1}, {'peters tom': 1}]
Possible candidate: [{'freiberg kevin': 31, 'frieberg kevin': 61}, {'freiberg jackie': 30}]
lengthNecessary: 26.200000000000003
[{'freiberg kevin': 31, 'frieberg kevin': 61}, {'freiberg jackie': 30}]
['frieberg kevin', 'freiberg jackie'] VS true_author: ['freiberg kevin', 'freiberg jackie']
ISBN: 1885203292
true author: Lewis W. Richard
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.28211307525634766
cluster_method: hierarchy
num_clusters_rate: 

In [6]:
from evaluation import *

In [13]:
# Score the fused author predictions (finalAuthors) against the ground truth
# (trueAuthors). Per the recorded output, the call prints precision, recall and
# f1Score, and the cell displays the returned 3-tuple of those values.
# NOTE(review): the meaning of the third argument (1) is not visible in this
# notebook -- confirm against evaluation.getEvaluation.
# NOTE(review): this cell has execution count 13 but sits above the In [8] cell
# that makes the identical call and reports different scores, so the numbers
# are not reproducible top-to-bottom; re-run from a fresh kernel to confirm.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.8682295877122069
recall is 0.9597855227882037
f1Score is 0.9117147707979626


(0.8682295877122069, 0.9597855227882037, 0.9117147707979626)

In [8]:
# Evaluate finalAuthors against trueAuthors; per the recorded output the call
# prints precision, recall and f1Score and the cell displays them as a 3-tuple.
# NOTE(review): this is the same call as the preceding cell, yet it was
# executed earlier (count 8 vs 13) and reports different scores. Presumably
# finalAuthors/trueAuthors or the evaluation code changed between the two
# runs -- verify which result is current and drop the stale cell.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.9014567266495287
recall is 0.9401251117068812
f1Score is 0.9203849518810149


(0.9014567266495287, 0.9401251117068812, 0.9203849518810149)