In [2]:
import os
import sys
import time
import numpy as np
import matplotlib.pyplot as plt
# Put the sibling `fusion` directory on the import path; presumably this is
# where the project modules imported further down live (TODO confirm).
# The relative path is resolved against the current working directory, so the
# notebook has to be started from its own folder for this to point at the
# right place.
module_path = os.path.abspath('../../fusion')
# Only append once: re-running this cell must not stack duplicate entries
# onto sys.path.
if module_path not in sys.path:
    sys.path.append(module_path)

from preprocessing_datasets.preprocessing_utilities import ValueUtils
from preprocessing_datasets import load_dataset
from embedding_algorithms import sentence_embedding, set_embedding_model
from dimensionality_reduction_algorithms import dimension_reduction_algorithms
from cluster_algorithms import cluster_algorithm

from helper import load_by_index, get_author_candidates, getFinalAuthors, launchWithoutReductionFusion
from plot_tools import plotChart, plotCluster

In [3]:
# Single configuration mapping shared by the notebook: it is handed unchanged to
# the dataset loader, the embedding-model setup and the fusion run.
key_values = dict(
    # --- sentence encoder settings ---
    model_type='bilstm',
    char_level=False,
    model_version=2,
    rnn_dim=1024,
    verbose=1,
    # --- what is embedded and with which embedding backend ---
    attributes_list=['author'],
    embedding_type='inferSent',
    # --- input dataset ---
    dataset='clean_book',
    # --- clustering / blocking settings ---
    cluster_method='hierarchy',
    num_clusters_rate=0.1,
    # NOTE(review): the key is spelled "thresold". It is kept verbatim because
    # the project code presumably looks it up under this exact name.
    # In the recorded output, "lengthNecessary" looks like this rate times the
    # total number of candidate mentions for an ISBN -- TODO confirm in helper.
    block_length_thresold=0.2,
)

In [4]:
# Load the dataset selected in key_values (the loader echoes the dataset name and
# its loading time). The four returned values are unpacked by position; the
# last three are passed on to the fusion run later in the notebook.
(
    dataset_name,
    table_group_by_isbn,
    isbn_list,
    true_authors,
) = load_dataset(key_values)

dataset: clean_book
Loading time is: 2.319929838180542


In [5]:
# Set up the embedding model from the settings in key_values. In the recorded
# run the output reports a setup time of about 190 s, so avoid re-running this
# cell unless the model settings actually changed.
set_embedding_model(key_values)

Vocab size : 2196017
model_version: 2
rnn_dim: 1024
model_type: bilstm
char_level: False
Setup time is: 189.85926985740662


In [6]:
# Run the fusion helper on the loaded tables and report how long the whole call
# took. perf_counter() is a monotonic, high-resolution clock intended for
# measuring intervals; time.time() follows the wall clock and can jump if the
# system time is adjusted while this cell is running.
start_time = time.perf_counter()
# Returns the authors chosen by the fusion together with the reference authors
# (as suggested by the "... VS true_author: ..." lines in the output).
finalAuthors, trueAuthors = launchWithoutReductionFusion(table_group_by_isbn, isbn_list, true_authors, key_values)
print("Total time is: {0}".format(time.perf_counter() - start_time))

ISBN: 0007197160
true author: Marren Peter
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.38725709915161133
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.19257497787475586
Discarted candidate: [{'conservation officer': 2, 'former scientist': 2}, {'marren naturalist peter': 2}]
Possible candidate: [{'marren peter': 19}]
lengthNecessary: 5.0
[{'marren peter': 19}]
['marren peter'] VS true_author: ['marren peter']
ISBN: 0029011086
true author: Averill James R.,Nunley Elma P.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11423897743225098
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0021071434020996094
Discarted candidate: [{'elma nunley p': 4}, {'averill': 1, 'james r': 1}]
Possible candidate: [{'averill james r': 21}]
lengthNecessary: 5.4
[{'averill james r': 21}]
['averill james r']

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2179279327392578
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.010634899139404297
Discarted candidate: [{'george witte': 1, 'glenn': 3}, {'van zutphen': 3}, {'schmitt': 3}, {'bernd': 3}]
Possible candidate: [{'bernd schmitt': 25}, {'glenn van zutphen': 19}]
lengthNecessary: 11.4
[{'bernd schmitt': 25}, {'glenn van zutphen': 19}]
['bernd schmitt', 'glenn van zutphen'] VS true_author: ['bernd schmitt', 'glenn van zutphen']
ISBN: 0241113873
true author: Critchley Julian
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06004786491394043
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0013499259948730469
Discarted candidate: [{'colin wheeler': 1}]
Possible candidate: [{'critchley': 1, 'critchley julian': 17}]
lengthNecessary: 3.8000000000000003
[

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04537320137023926
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001667022705078125
Discarted candidate: [{'maurice thompson': 1}]
Possible candidate: [{'moritz thomsen': 16}]
lengthNecessary: 3.4000000000000004
[{'moritz thomsen': 16}]
['moritz thomsen'] VS true_author: ['moritz thomsen']
ISBN: 0439436559
true author: Nix Garth
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08526015281677246
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.004390716552734375
Discarted candidate: [{'garth nix': 2}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}, {'garth nix': 1}]
Possible candidate: [{'garth nix': 45}]
lengthNecessary: 10.200000000000001
[{'garth nix': 45}]
['garth nix'] VS true_author: ['garth nix']
ISBN: 0439670195
true author: Kerr 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2308642864227295
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.012603998184204102
Discarted candidate: [{'donald katz': 18}, {'adult viking': 1}, {'adult viking': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}, {'donald katz r': 1}]
Possible candidate: [{'donald katz r': 76}]
lengthNecessary: 20.400000000000002
[{'donald katz r': 76}]
['donald katz r'] VS true_author: ['donald katz r']
ISBN: 0671640984
true author: Turnbull Colin M.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2112867832183838
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005922079086303711
Discarted candidate: [{'colin turnbull': 7}, {'turnbull': 2}, {'colin m turnbull': 1}, {'colin m turnbull': 1}, {'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05817699432373047
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0013041496276855469
Discarted candidate: [{'american heritage': 1}]
Possible candidate: [{'david peckinpah re sam weddle': 1, 'david weddle': 16}]
lengthNecessary: 3.6
[{'david peckinpah re sam weddle': 1, 'david weddle': 16}]
['david weddle'] VS true_author: ['david weddle']
ISBN: 0805048332
true author: Brodkey Harold
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.030803203582763672
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0012760162353515625
Discarted candidate: []
Possible candidate: [{'brodkey harold': 2, 'bruno giuseppe': 1}]
lengthNecessary: 0.6000000000000001
[{'brodkey harold': 2, 'bruno giuseppe': 1}]
['brodkey harold'] VS true_author: ['brodkey harold']
ISBN:

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.14728665351867676
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0025000572204589844
Discarted candidate: [{'johnston ollie': 1}]
Possible candidate: [{'johnston ollie': 18}, {'frank thomas': 9}]
lengthNecessary: 5.6000000000000005
[{'johnston ollie': 18}, {'frank thomas': 9}]
['johnston ollie', 'frank thomas'] VS true_author: ['johnston ollie', 'frank thomas']
ISBN: 159558191X
true author: Moby,Park Miyun
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09402227401733398
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.003461122512817383
Discarted candidate: [{'miyun park': 7}, {'moby park': 2}, {'and miyun park': 1}, {'moby': 1}]
Possible candidate: [{'moby': 35}]
lengthNecessary: 9.200000000000001
[{'moby': 35}]
['moby'] VS true_author: ['m

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3561370372772217
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014636993408203125
Discarted candidate: [{'doug welsch': 6}, {'doug welsh': 2, 'douglas welsh': 1, 'doyg welsh': 1, 'welsh': 2}, {'connie effefson': 1, 'connie ellefson': 3, 'connie ellefson l': 1, 'connie ellefson loc': 1}, {'lockhart thomas': 1, 'steph thomas': 1, 'stephens tom': 3}, {'ellefson stephens': 2, 'stephens': 1, 'stephens tho': 1}, {'l': 1}, {'dough welsh': 1}]
Possible candidate: [{'connie ellefson lockhart': 28, 'connie lockhart': 1}, {'l stephens thomas': 25}, {'douglas ellefson f welsh': 1, 'douglas f welsh': 23}]
lengthNecessary: 21.400000000000002
[{'connie ellefson lockhart': 28, 'connie lockhart': 1}, {'l stephens thomas': 25}, {'douglas ellefson f welsh': 1, 'douglas f welsh': 23}]
['connie ellefson lockhart', 'l stephens thomas', 'douglas f welsh'] VS t

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13707280158996582
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.005262851715087891
Discarted candidate: [{'alec guiness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}, {'alec guinness': 1}]
Possible candidate: [{'alec guinness': 58}]
lengthNecessary: 12.8
[{'alec guinness': 58}]
['alec guinness'] VS true_author: ['alec guinness']
ISBN: 029777283X
true author: Richards J. M.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05149507522583008
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009779930114746094
Discarted candidate: []
Possible candidate: [{'j m richards': 5, 'j richards': 1, 'james maude richards': 1, 'm': 1}]
lengthNecessary: 1.6
[{'j m richards': 5, 'j richards': 1, 'james maude ric

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10147619247436523
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 7
Blocking time is: 0.0052051544189453125
Discarted candidate: [{'beaton c m': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}, {'ann beattie': 1}]
Possible candidate: [{'ann beattie': 56}]
lengthNecessary: 12.4
[{'ann beattie': 56}]
['ann beattie'] VS true_author: ['ann beattie']
ISBN: 0395138841
true author: Farris Martin T.,Sampson Roy J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.047979116439819336
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009882450103759766
Discarted candidate: []
Possible candidate: [{'farris m y': 1, 'farris martin t': 4, 'j r simpson': 1, 'j roy sampson': 1}]
lengthNecessary: 1.4000000000000001
[{'farris m y': 1, 'farris martin 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06351089477539062
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.003008127212524414
Discarted candidate: [{'aa vv': 1}, {'weinberg': 1}, {'steven weinberg': 1}]
Possible candidate: [{'steven weinberg': 31}]
lengthNecessary: 6.800000000000001
[{'steven weinberg': 31}]
['steven weinberg'] VS true_author: ['steven weinberg']
ISBN: 0521880696
true author: Nucci Antonio,Papagiannaki Konstantina
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07127666473388672
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.005369901657104492
Discarted candidate: [{'konstantin papagiannaki': 1}, {'konstantina papagiannaki': 1}, {'konstantina papagiannaki': 1}, {'konstantina papagiannaki': 1}]
Possible candidate: [{'antonio nucci': 33}, {'konstantina papagiannaki':

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.0708308219909668
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.003431081771850586
Discarted candidate: [{'george ulrich': 4}, {'jan karon': 1}, {'jan karon': 1}]
Possible candidate: [{'jan karon': 34}]
lengthNecessary: 8.0
[{'jan karon': 34}]
['jan karon'] VS true_author: ['jan karon']
ISBN: 0765366665
true author: Wiehl Lis,Henry April
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06981301307678223
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0038580894470214844
Discarted candidate: [{'april henry': 1}, {'lis wiehl': 1}, {'april henry': 1}]
Possible candidate: [{'lis wiehl': 24}, {'april henry': 19}]
lengthNecessary: 9.200000000000001
[{'lis wiehl': 24}, {'april henry': 19}]
['lis wiehl', 'april henry'] VS true_author: ['lis wiehl', '

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24695181846618652
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 6
Blocking time is: 0.008037805557250977
Discarted candidate: [{'assis tov': 1}, {'yom': 1}, {'folberg': 1}, {'folberg neil photography': 1}]
Possible candidate: [{'folberg neil': 26, 'neil': 1}, {'assis tov yom': 24}]
lengthNecessary: 11.0
[{'folberg neil': 26, 'neil': 1}, {'assis tov yom': 24}]
['folberg neil', 'assis tov yom'] VS true_author: ['folberg neil']
ISBN: 0908228082
true author: Mollison Bill,Slay Reny Mia
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06163907051086426
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015649795532226562
Discarted candidate: [{'mia reny slay': 2}]
Possible candidate: [{'bill mollison': 11}]
lengthNecessary: 2.6
[{'bill mollison': 11}]
['bill mollison'] 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.31462788581848145
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.012214183807373047
Discarted candidate: [{'kaplan robert steven': 4}, {'davenport h thomas': 3}, {'kaplan rs': 3}, {'dp norton': 3}, {'david norton p': 1}, {'david norton p': 1}, {'david norton p': 1}, {'david norton p': 1}]
Possible candidate: [{'kaplan robert s': 41}, {'david norton p': 34}]
lengthNecessary: 18.400000000000002
[{'kaplan robert s': 41}, {'david norton p': 34}]
['kaplan robert s', 'david norton p'] VS true_author: ['kaplan robert s', 'david norton p']
ISBN: 1851774882
true author: Ajmar-Wollheim Marta,Dennis Flora
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.043025970458984375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001789093017578125
Discarted cand

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04912304878234863
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0012238025665283203
Discarted candidate: []
Possible candidate: [{'e frank r': 4, 'e frank ronald': 1, 'g greenberg m': 2}]
lengthNecessary: 1.4000000000000001
[{'e frank r': 4, 'e frank ronald': 1, 'g greenberg m': 2}]
['e frank r'] VS true_author: ['e frank ronald', 'g greenberg marshall']
ISBN: 0904230112
true author: Mondey David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07992982864379883
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002635955810546875
Discarted candidate: [{'ross stanley': 6}, {'david mondey': 2}, {'david money': 1}]
Possible candidate: [{'david mondey': 25}]
lengthNecessary: 6.800000000000001
[{'david mondey': 25}]
['david mondey'] VS true_author:

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08634185791015625
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0023250579833984375
Discarted candidate: [{'unnamed': 1}]
Possible candidate: [{'heath joseph': 13, 'joseph': 1}, {'andrew heath potter': 1, 'andrew potter': 13}]
lengthNecessary: 5.800000000000001
[{'heath joseph': 13, 'joseph': 1}, {'andrew heath potter': 1, 'andrew potter': 13}]
['heath joseph', 'andrew potter'] VS true_author: ['heath joseph', 'andrew potter']
ISBN: 0812974875
true author: Orlean Susan
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05624890327453613
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0015289783477783203
Discarted candidate: []
Possible candidate: [{'orlean s': 1, 'orlean susan': 1}]
lengthNecessary: 0.4
[{'orlean s': 1, 'orlean susan': 1}]
['o

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.15385794639587402
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0006771087646484375
Discarted candidate: []
Possible candidate: [{'jackson m william': 6, 'nan': 1}, {'billy eds evans joe': 1, 'billy evans joe': 3}]
lengthNecessary: 2.2
[{'jackson m william': 6, 'nan': 1}, {'billy eds evans joe': 1, 'billy evans joe': 3}]
['jackson m william', 'billy evans joe'] VS true_author: ['jackson m william', 'billie evans joe']
ISBN: 039446124X
true author: Boyer Richard O.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2306368350982666
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002972841262817383
Discarted candidate: [{'brown john': 1}, {'by': 1}]
Possible candidate: [{'boyer owen richard': 22}, {'boyer o rchard': 1, 'boyer o richard': 13, 'bo

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08123302459716797
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.00360107421875
Discarted candidate: [{'harmon henkin jeff johnson': 2}, {'jeff johnson': 1}, {'harmon henkin': 1}]
Possible candidate: [{'harmon henkin': 36}]
lengthNecessary: 8.0
[{'harmon henkin': 36}]
['harmon henkin'] VS true_author: ['harmon henkin']
ISBN: 0091800854
true author: Alibek Ken,Handelman Stephen
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04761695861816406
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0023119449615478516
Discarted candidate: [{'alibek ken': 1}]
Possible candidate: [{'handelman stephen': 11}, {'alibek ken': 11}]
lengthNecessary: 4.6000000000000005
[{'handelman stephen': 11}, {'alibek ken': 11}]
['handelman stephen', 'alibek ken'] VS true_

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20486998558044434
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.013251066207885742
Discarted candidate: [{'darrell k sweet': 2}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}]
Possible candidate: [{'brooks terry': 66}]
lengthNecessary: 14.8
[{'brooks terry': 66}]
['brooks terry'] VS true_author: ['brooks terry']
ISBN: 0671736493
true author: Carew Jack
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18923687934875488
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.023327350616455078
Discarted candidate: [{'carew': 1}, {'carew jack': 1}, {'carew jan': 1}, {'carew jack': 1}]
Possible candidate: [{'carew jack': 38}]
lengthNecessary: 8.4
[{'carew jack': 38}]
['carew 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.28668689727783203
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.011600971221923828
Discarted candidate: [{'f healy jeremiah': 13}, {'f healy jeremiah': 2}, {'healy jermiah': 1}, {'f healy jeremiah': 1}, {'f healy jeremiah': 1}, {'f healy jeremiah': 1}, {'healy jeremiah': 1}, {'healy jeremiah': 1}, {'healy jeremiah': 1}]
Possible candidate: [{'healy jeremiah': 79}]
lengthNecessary: 20.200000000000003
[{'healy jeremiah': 79}]
['healy jeremiah'] VS true_author: ['healy jeremiah']
ISBN: 052881821X
true author: Dedmon Emmett
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06088399887084961
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0017390251159667969
Discarted candidate: [{'bennett charles': 3}, {'author photographs the': 1, 'dedmon e': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.138901948928833
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0075566768646240234
Discarted candidate: [{'lee trevino': 1}, {'blair sam': 1}, {'lee trevino': 1}]
Possible candidate: [{'lee trevino': 22}, {'blair sam': 20}]
lengthNecessary: 9.0
[{'lee trevino': 22}, {'blair sam': 20}]
['lee trevino', 'blair sam'] VS true_author: ['lee trevino', 'blair sam']
ISBN: 048642541X
true author: Dym Clive L.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.07121491432189941
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015177726745605469
Discarted candidate: [{'clive dym': 1}]
Possible candidate: [{'clive dym l': 13}]
lengthNecessary: 2.8000000000000003
[{'clive dym l': 13}]
['clive dym l'] VS true_author: ['clive dym l']
ISBN: 0070629218
true auth

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11113977432250977
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0043299198150634766
Discarted candidate: [{'john richardson': 4}, {'john richardson sir': 2}, {'foreword john richardson': 2}, {'sir': 1}]
Possible candidate: [{'"gillian newberry': 1, 'gillian newberry': 33}]
lengthNecessary: 8.6
[{'"gillian newberry': 1, 'gillian newberry': 33}]
['gillian newberry'] VS true_author: ['gillian newberry']
ISBN: 0824786157
true author: Yalkowsky Samuel H.,Banerjee Sujit
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04745912551879883
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0009608268737792969
Discarted candidate: []
Possible candidate: [{'banerjee sujit': 4, 'h samuel yalkowsky': 5}]
lengthNecessary: 1.8
[{'banerjee sujit': 4, 'h samuel 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2148120403289795
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01579880714416504
Discarted candidate: [{'a hassett kevin': 18}, {'glassma': 1, 'kassett': 1}, {'glassman': 1}, {'a hassett kevin': 1}, {'a hassett kevin': 1}, {'a hassett kevin': 1}, {'a hassett kevin': 1}]
Possible candidate: [{'glassman james': 28}, {'hassett kevin': 25}, {'glassman james k': 23}]
lengthNecessary: 20.200000000000003
[{'glassman james': 28}, {'hassett kevin': 25}, {'glassman james k': 23}]
['glassman james', 'hassett kevin', 'glassman james k'] VS true_author: ['glassman james k', 'hassett kevin']
ISBN: 0123745500
true author: Isaacs I. Martin
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08072280883789062
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.28190112113952637
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.028149127960205078
Discarted candidate: [{'simon wincester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}, {'simon winchester': 1}]
Possible candidate: [{'simon winchester': 119}]
lengthNecessary: 25.6
[{'simon winchester': 119}]
['simon winchester'] VS true_author: ['simon winchester']
ISBN: 1580931049
true author: Frick Symington Sanger Martha
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08378911018371582
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0017442703247070312
Discarted candidate: [{'garrett wendell': 1}]
Possible candidate: [{'f

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06147503852844238
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0012488365173339844
Discarted candidate: [{'brandt edgar joan kahr': 1, 'brandt joan kahr': 1}]
Possible candidate: [{'joan kahr': 16}]
lengthNecessary: 3.6
[{'joan kahr': 16}]
['joan kahr'] VS true_author: ['joan kahr']
ISBN: 0449210294
true author: MacKeever Maggie
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.04172396659851074
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.00145721435546875
Discarted candidate: [{'by mackeever maggie': 1}]
Possible candidate: [{'mackeever maggie': 12}]
lengthNecessary: 2.6
[{'mackeever maggie': 12}]
['mackeever maggie'] VS true_author: ['mackeever maggie']
ISBN: 0006165915
true author: Campbell Ramsey
embedding_type: inferSent
attributes_

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19568991661071777
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.010100841522216797
Discarted candidate: [{'gaines s steven': 5}, {'gaines steven': 2}, {'gaines stephen': 1}, {'gaines steven': 1}, {'gaines steven': 1}, {'gaines steven': 1}, {'gaines s steven': 1}, {'gaines steven': 1}]
Possible candidate: [{'gaines steven': 73}]
lengthNecessary: 17.2
[{'gaines steven': 73}]
['gaines steven'] VS true_author: ['gaines steven']
ISBN: 0891071806
true author: Siegel Robert
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05594778060913086
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015454292297363281
Discarted candidate: [{'kurt mitchell': 3}]
Possible candidate: [{'robert siegel': 17}]
lengthNecessary: 4.0
[{'robert siegel': 17}]
['robert si

Blocking time is: 0.015556097030639648
Discarted candidate: [{'walter': 1, 'walter wangerin': 13}, {'jr': 5, 'jr wangerin': 1}, {'walter wangerin': 1}, {'walter wangerin': 1}, {'walter wangerin': 1}, {'walter wangerin': 1}, {'jr walter wangerin': 1}]
Possible candidate: [{'jr walter wangerin': 52}]
lengthNecessary: 15.4
[{'jr walter wangerin': 52}]
['jr walter wangerin'] VS true_author: ['jr walter wangerin']
ISBN: 0521619106
true author: Pollack Henry N.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.09712409973144531
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 3
Blocking time is: 0.0014238357543945312
Discarted candidate: [{'h n pollack': 2}, {'henry n pollack': 2}]
Possible candidate: [{'henry n pollack': 19}]
lengthNecessary: 4.6000000000000005
[{'henry n pollack': 19}]
['henry n pollack'] VS true_author: ['henry n pollack']
ISBN: 0521362172
true author: Kent Susan
embedding_type: inferSent
attribute

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08335399627685547
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.0033388137817382812
Discarted candidate: [{'oliver r': 1}]
Possible candidate: [{'allen george': 14}, {'allen gerald': 10}, {'oliver richard': 9}]
lengthNecessary: 6.800000000000001
[{'allen george': 14}, {'allen gerald': 10}, {'oliver richard': 9}]
['allen george', 'allen gerald', 'oliver richard'] VS true_author: ['allen gerald', 'oliver richard']
ISBN: 0273703692
true author: Weetman Pauline
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06552505493164062
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0015790462493896484
Discarted candidate: []
Possible candidate: [{'pauline weetman': 11}, {'pauline prof weetman': 3}]
lengthNecessary: 2.8000000000000003
[{'pauline weetman'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1959068775177002
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03703188896179199
Discarted candidate: [{'joe nocera': 2}, {'bethany mclean': 1}, {'bethany mclean': 1}, {'bethany mclean': 1}, {'bethany mclean': 1}, {'bethany mclean': 1}, {'bethany mclean': 1}, {'bethany mclean': 1}]
Possible candidate: [{'bethany mclean': 56}, {'joe nocera': 46}]
lengthNecessary: 22.200000000000003
[{'bethany mclean': 56}, {'joe nocera': 46}]
['bethany mclean', 'joe nocera'] VS true_author: ['bethany mclean', 'joe nocera']
ISBN: 142212584X
true author: Harris Ethan S.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.10365605354309082
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.003422975540161133
Discarted candidate: [{'es harris': 3}, {'es harris': 2}, {

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.15737080574035645
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008353948593139648
Discarted candidate: [{'davis n z': 2}, {'collectif': 1}, {'davis': 1}, {'davis natalie': 1}, {'davis natalie zemon': 1}, {'davis natalie zemon': 1}, {'davis natalie zemon': 1}]
Possible candidate: [{'davis natalie': 1, 'davis natalie zemon': 71}]
lengthNecessary: 16.0
[{'davis natalie': 1, 'davis natalie zemon': 71}]
['davis natalie zemon'] VS true_author: ['davis natalie zemon']
ISBN: 0425262308
true author: Clancy Tom,Greaney Mark
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.16343188285827637
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015561342239379883
Discarted candidate: [{'greaney mark': 2}, {'clancy greaney': 1}, {'tom': 1}, {'greaney mark': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06673526763916016
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.003981113433837891
Discarted candidate: [{'k nair': 1}, {'keshavan nair': 1}, {'keshavan nair': 1}, {'keshavan nair': 1}]
Possible candidate: [{'keshavan nair': 44, 'nair': 1}]
lengthNecessary: 9.8
[{'keshavan nair': 44, 'nair': 1}]
['keshavan nair'] VS true_author: ['keshavan nair']
ISBN: 0415422051
true author: Emmerson Richard K.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08710193634033203
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0035431385040283203
Discarted candidate: [{'clayton-emmerson sandra': 4}, {'clayton-emmerson sandra': 2}, {'clayton-emmerson eds sandra': 1}, {'emmerson k richard': 1}]
Possible candidate: [{'emmerson k richard': 39}]
lengthNecessary: 9.

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.06821870803833008
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 5
Blocking time is: 0.0038709640502929688
Discarted candidate: [{'iii kiechel walter': 7}, {'kiechel w': 4}, {'kiechel w': 1}, {'kiechel walter': 1}]
Possible candidate: [{'kiechel walter': 29, 'walter': 1}]
lengthNecessary: 8.6
[{'kiechel walter': 29, 'walter': 1}]
['kiechel walter'] VS true_author: ['iii kiechel walter']
ISBN: 0733306195
true author: Dickson Wright Clarissa,Paterson Jennifer
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05429410934448242
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.00125885009765625
Discarted candidate: [{'clarissa dickson wright': 3}]
Possible candidate: [{'clarissa dickson-wright': 3, 'dickson-wright': 2, 'dickson-wright paterson': 5, 'jennifer paterson': 3

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.035894155502319336
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 1
Blocking time is: 0.0011110305786132812
Discarted candidate: []
Possible candidate: [{'clifford john mortimer': 1, 'john mortimer': 2}]
lengthNecessary: 0.6000000000000001
[{'clifford john mortimer': 1, 'john mortimer': 2}]
['john mortimer'] VS true_author: ['john mortimer']
ISBN: 0262122995
true author: Lyson Thomas A.,Stevenson G. W.,Welsh Rick
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.05456209182739258
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.001771688461303711
Discarted candidate: []
Possible candidate: [{'a lyson thomas': 7}, {'g stevenson w': 3, 'mit press the': 1, 'rick welsh': 3}]
lengthNecessary: 2.8000000000000003
[{'a lyson thomas': 7}, {'g stevenson w': 3, 'mit press the'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.08286118507385254
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 4
Blocking time is: 0.002473115921020508
Discarted candidate: [{'carlson melody': 1}, {'a carlson melody': 1}]
Possible candidate: [{'a carlson melody': 26}, {'carlson melody': 9}]
lengthNecessary: 7.4
[{'a carlson melody': 26}, {'carlson melody': 9}]
['a carlson melody', 'carlson melody'] VS true_author: ['carlson melody']
ISBN: 0297646281
true author: Nuland Sherwin B.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.043753862380981445
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 2
Blocking time is: 0.0012369155883789062
Discarted candidate: [{'da leonardo vinci': 1}]
Possible candidate: [{'b nuland sherwin': 8, 'nuland sherwin': 5}]
lengthNecessary: 2.8000000000000003
[{'b nuland sherwin': 8, 'nuland sherwin': 5}]
[

Blocking time is: 0.015279769897460938
Discarted candidate: [{'cuddihy jane mary': 1, 'mary p': 1}, {'cuddihy john murray': 1, 'f john murray': 1}, {'clendenin j ryan': 1, 'j lannan patrick': 1}, {'fr regis ryan': 1}, {'alison murray': 1}, {'charlotte harrris mcdonald': 1}, {'design dunbar patricia': 1}, {'donald marshall w': 1}, {'cuddihy de harriet haven': 1}]
Possible candidate: [{'birmingham stephen': 86}]
lengthNecessary: 19.6
[{'birmingham stephen': 86}]
['birmingham stephen'] VS true_author: ['birmingham stephen']
ISBN: 0060112980
true author: Ford Betty
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24315500259399414
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.022741079330444336
Discarted candidate: [{'betty ford': 2}, {'betty chase ford~chris': 1}, {'betty ford': 1}, {'betty ford': 1}, {'betty ford': 1}, {'betty ford': 1}, {'betty ford': 1}, {'betty ford': 1}]
Possible can

Blocking time is: 0.011164188385009766
Discarted candidate: [{'bienvenu marcelle': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}, {'emeril lagasse': 1}]
Possible candidate: [{'emeril lagasse': 73}]
lengthNecessary: 16.0
[{'emeril lagasse': 73}]
['emeril lagasse'] VS true_author: ['emeril lagasse']
ISBN: 006018650X
true author: Taylor Bradford Barbara
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2217710018157959
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.010888814926147461
Discarted candidate: [{'barbara bradford taylor': 2}, {'barbera bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}, {'barbara bradford taylor': 1}]
Possible candidate: [{'barbara b

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.40414905548095703
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03664112091064453
Discarted candidate: [{'leigh richard': 2}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}, {'baigent michael': 1}]
Possible candidate: [{'baigent michael': 81}]
lengthNecessary: 18.2
[{'baigent michael': 81}]
['baigent michael'] VS true_author: ['baigent michael']
ISBN: 0060892579
true author: Albright Madeleine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 1.2028987407684326
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.11133313179016113
Discarted candidate: [{'bill woodward': 31}, {'william woodward': 25}, {'albright k madeleine': 12},

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.18132686614990234
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.015137672424316406
Discarted candidate: [{'bryan bulfinch compiled holme thomas': 4}, {'campbell joseph': 4}, {'bryan hulme': 1}, {'christopher holme': 1}, {'bulfinch thomas': 1}, {'bulfinch thomas': 1}, {'bulfinch thomas': 1}, {'bulfinch thomas': 1}]
Possible candidate: [{'bulfinch thomas': 59}, {'bryan holme': 31}]
lengthNecessary: 20.8
[{'bulfinch thomas': 59}, {'bryan holme': 31}]
['bulfinch thomas', 'bryan holme'] VS true_author: ['bulfinch thomas', 'bryan holme']
ISBN: 0140092501
true author: Gleick James
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17555785179138184
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017663955688476562
Discarted candidate: [{'gleick jam

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.32550907135009766
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.07756996154785156
Discarted candidate: [{'studios': 1}, {'david guterson pictures universal': 1}, {'jr': 1}, {'f guste roy': 1}, {'david guterson': 1}, {'d guterson': 1}, {'d guterson': 1}, {'david guterson': 1}, {'david guterson': 1}]
Possible candidate: [{'david guterson': 241}]
lengthNecessary: 50.0
[{'david guterson': 241}]
['david guterson'] VS true_author: ['david guterson']
ISBN: 0151005346
true author: Reverte Perez Arturo
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.6530389785766602
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.11083793640136719
Discarted candidate: [{'margaret peden sayers': 56}, {'arturo p rez-reverte': 35}, {'margaret peden': 8}, {'margaret s

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2938418388366699
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.025882959365844727
Discarted candidate: [{'venturi': 3}, {'br denise scott': 1}, {'venturi': 1}, {'venturi': 1}, {'brown izenourdenise robert scott venturisteven': 1}, {'venturi': 1}, {'robert venturi': 1}]
Possible candidate: [{'izenour robert venturi': 3, 'robert venturi': 55}, {'azenour steven': 1, 'izenour steven': 41}, {'brown denise scott': 39}]
lengthNecessary: 29.6
[{'izenour robert venturi': 3, 'robert venturi': 55}, {'azenour steven': 1, 'izenour steven': 41}, {'brown denise scott': 39}]
['robert venturi', 'izenour steven', 'brown denise scott'] VS true_author: ['robert venturi', 'brown denise scott', 'izenour steven']
ISBN: 0300044402
true author: Saggs W. F. H.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding tim

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.4725830554962158
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.057787179946899414
Discarted candidate: [{'meyer stephanie': 6}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}, {'meyer stephenie': 1}]
Possible candidate: [{'meyer stephenie': 190}]
lengthNecessary: 40.800000000000004
[{'meyer stephenie': 190}]
['meyer stephenie'] VS true_author: ['meyer stephenie']
ISBN: 0316109304
true author: Bronowski J.
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.20181775093078613
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01760101318359375
Discarted candidate: [{'bronowski j': 1}, {'bronowski jacob': 1}, {'bronowski j': 1}, {

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.25290393829345703
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.016777992248535156
Discarted candidate: [{'jacket keith parkinson': 1}, {'art': 1}, {'feinman jeffrey': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}, {'brooks terry': 1}]
Possible candidate: [{'brooks terry': 107}]
lengthNecessary: 23.200000000000003
[{'brooks terry': 107}]
['brooks terry'] VS true_author: ['brooks terry']
ISBN: 0345371984
true author: Adams Douglas,Carwardine Mark
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1641228199005127
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017355918884277344
Discarted candidate: [{'adams': 5}, {'carwardine mark': 2}, {'carwardine mark': 1}, {'carwardine mark': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.22502803802490234
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.010222196578979492
Discarted candidate: [{'b greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}, {'brian greene': 1}]
Possible candidate: [{'brian greene': 83}]
lengthNecessary: 18.400000000000002
[{'brian greene': 83}]
['brian greene'] VS true_author: ['brian greene']
ISBN: 0375414967
true author: Russo Richard
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24178099632263184
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.020340919494628906
Discarted candidate: [{'richard russo': 2}, {'r russo': 1}, {'richard russo': 1}, {'richard russo': 1}, {'richard russo': 1}, {'r

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.26174330711364746
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.04919290542602539
Discarted candidate: [{'marian schwartz': 12}, {'edward radzinsky': 2}, {'clifford dowdey': 2}, {'edvard radzinsky': 2}, {'marian schwartz transl': 1}, {'photos': 1}, {'edvard marian radzinsky schwartz': 1}, {'edvard radzinsky w': 1}, {'marian schwartz trans': 1}]
Possible candidate: [{'edvard radzinskii': 4, 'edvard radzinsky': 103}]
lengthNecessary: 26.0
[{'edvard radzinskii': 4, 'edvard radzinsky': 103}]
['edvard radzinsky'] VS true_author: ['edvard radzinsky']
ISBN: 0385425473
true author: Chang Jung
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3053290843963623
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.017189979553222656
Discarted candidate: [{'

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5374689102172852
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.043044090270996094
Discarted candidate: [{'a rice': 6}, {'anne rice': 2}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}, {'anne rice': 1}]
Possible candidate: [{'anne rice': 123}]
lengthNecessary: 27.6
[{'anne rice': 123}]
['anne rice'] VS true_author: ['anne rice']
ISBN: 0394502787
true author: Pagels Elaine
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2904818058013916
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.00716090202331543
Discarted candidate: [{'elaine h pagels': 9}, {'elaine pagels': 4}, {'elaine pagels': 3}, {'elaine h pagels': 2}, {'elaine pagels': 1}, {'elaine pagels': 1}, {'elaine pagels': 1}]
Pos

Blocking time is: 0.2850217819213867
Discarted candidate: [{'rosalynn': 53}, {'cartere jimmy': 2, 'jimmy': 15}, {'crater jimmy': 2}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn': 1}, {'rosalynn y': 1}]
Possible candidate: [{'carter jimmy': 228}, {'*signed carter rosalynn': 2, 'carter rosalynn': 162}]
lengthNecessary: 93.80000000000001
[{'carter jimmy': 228}, {'*signed carter rosalynn': 2, 'carter rosalynn': 162}]
['carter jimmy', 'carter rosalynn'] VS true_author: ['carter jimmy', 'carter rosalynn']
ISBN: 0394561236
true author: Gore Vidal
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.37839198112487793
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.018491744995117188
Discarted candidate: [{'box edgar': 2}, {'gore vidal': 1}, {'box edgar': 1}, {'box edgar': 1}, {'box edgar': 1}, {'box edgar': 1}, {'j robert stanton': 1}, {'box edgar': 1}, {'eric lustbader van': 1}]
P

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5502970218658447
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.1016991138458252
Discarted candidate: [{'heat moon': 29}, {'heat l moon william': 2, 'heat least moon william': 9}, {'heat-moon least': 5}, {'heat-moon': 4}, {'white': 3}, {'black photographs': 3}, {'e i trogdon william': 2}, {'hank stuever': 2}, {'heat-moon least wm': 1}]
Possible candidate: [{'heat-moon least william': 211, 'least william': 29}]
lengthNecessary: 60.0
[{'heat-moon least william': 211, 'least william': 29}]
['heat-moon least william'] VS true_author: ['heat-moon least william']
ISBN: 0395488842
true author: Harrison Jim
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1522989273071289
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.008035659790039062
Discarted c

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1969749927520752
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014251947402954102
Discarted candidate: [{'carol colman': 19}, {'gary heaven': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'carol colman': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'gary heavin': 1}, {'gary heavin': 1}]
Possible candidate: [{'gary heavin': 70}]
lengthNecessary: 19.400000000000002
[{'gary heavin': 70}]
['gary heavin'] VS true_author: ['gary heavin', 'carol colman']
ISBN: 0399157824
true author: Cussler Clive,Brown Graham
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.35231781005859375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.027640104293823242
Discarted candidate: [{'brown graham': 4}, {'clive cussler': 2}, {'brown graham': 1}, {'adventure austin ku

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2908201217651367
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.033953189849853516
Discarted candidate: [{'collectif': 2}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}, {'briggs patricia': 1}]
Possible candidate: [{'briggs patricia': 156}]
lengthNecessary: 33.2
[{'briggs patricia': 156}]
['briggs patricia'] VS true_author: ['briggs patricia']
ISBN: 0446387878
true author: Dorris Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19091486930847168
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.020595312118530273
Discarted candidate: [{'dorris michael': 2}, {'dorris morris': 1}, {'dorris michael': 1}, {'dorris micha

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2052009105682373
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011354923248291016
Discarted candidate: [{'hawking stephen': 7}, {'krauss lawrence': 3}, {'foreword hawking stephen': 2}, {'krauss': 1}, {'albee edward': 1}, {'krauss lawrence m w': 1}, {'m': 1}, {'foreword': 1}]
Possible candidate: [{'krauss lawrence m': 72}]
lengthNecessary: 17.8
[{'krauss lawrence m': 72}]
['krauss lawrence m'] VS true_author: ['krauss lawrence m']
ISBN: 051511779X
true author: Roberts Nora
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.15110516548156738
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.011143922805786133
Discarted candidate: [{'noraauthor roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora roberts': 1}, {'nora

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.617699146270752
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.15465188026428223
Discarted candidate: [{'a iacocca lee': 29}, {'a et iacocca lee novak william': 2}, {'iacocca lee w': 2}, {'novak wm': 2}, {'iacocca l': 1}, {'iacocca l': 1}, {'iacocca lee': 1}, {'iacocca lee': 1}]
Possible candidate: [{'iacocca lee': 153}, {'novak william': 60}]
lengthNecessary: 50.400000000000006
[{'iacocca lee': 153}, {'novak william': 60}]
['iacocca lee', 'novak william'] VS true_author: ['iacocca lee']
ISBN: 0553051253
true author: Benford Gregory,Brin David
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2538177967071533
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02053666114807129
Discarted candidate: [{'ad benford brin david gregory': 1}, {'brin d

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13276314735412598
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01566600799560547
Discarted candidate: [{'larty mc': 1}, {'**debut *s-p-e-c-t-u-l-a-r novel ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}, {'mclarty ron': 1}]
Possible candidate: [{'mclarty ron': 107}]
lengthNecessary: 23.200000000000003
[{'mclarty ron': 107}]
['mclarty ron'] VS true_author: ['mclarty ron']
ISBN: 0670036781
true author: Madonna 
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.2165529727935791
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.01941990852355957
Discarted candidate: [{'fulrimari jeffrey': 2, 'fulvimari jeffrey': 10}, {'fulrimari jeffrey madonna': 4, 'fulvimari jeffr

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.24170494079589844
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.011019706726074219
Discarted candidate: [{'boyle coraghessan t': 2}, {'coraghessan': 1}, {'c': 1}, {'boyle c t': 1}, {'boyd malcolm': 1}, {'boyle c t': 1}, {'boyle c t': 1}]
Possible candidate: [{'boyle c t': 62}, {'boyle coraghessan t': 18, 'boyle t': 1}]
lengthNecessary: 17.8
[{'boyle c t': 62}, {'boyle coraghessan t': 18, 'boyle t': 1}]
['boyle c t', 'boyle coraghessan t'] VS true_author: ['boyle c t']
ISBN: 0670891916
true author: Bradford Sarah
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17399907112121582
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.013316869735717773
Discarted candidate: [{'bradford sarah': 2}, {'kennedy': 1}, {'jacqueline onassis': 1}, {'bradford 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.6015849113464355
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.10840773582458496
Discarted candidate: [{'collier': 2}, {'horowitz peter': 1}, {'collier horo': 1}, {'peter': 1}, {'h perkin': 1}, {'collier peter': 1}, {'collier peter': 1}, {'horowitz': 1}]
Possible candidate: [{'collier peter': 110}, {'david horowitz': 101}]
lengthNecessary: 44.0
[{'collier peter': 110}, {'david horowitz': 101}]
['collier peter', 'david horowitz'] VS true_author: ['collier peter', 'david horowitz']
ISBN: 0671622617
true author: Prager Dennis,Telushkin Joseph
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.42129015922546387
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03620600700378418
Discarted candidate: [{'joseph telushkin': 2}, {'joseph rabbi telushki

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.47080516815185547
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.02079010009765625
Discarted candidate: [{'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}, {'chang jung': 1}, {'halliday jon': 1}]
Possible candidate: [{'chang jung': 65}, {'halliday jon': 56}]
lengthNecessary: 25.8
[{'chang jung': 65}, {'halliday jon': 56}]
['chang jung', 'halliday jon'] VS true_author: ['chang jung', 'halliday jon']
ISBN: 0679425411
true author: Shaara Michael
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.11033868789672852
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.006414175033569336
Discarted candidate: [{'michael shaara': 4}, {'michael shaara': 1}, {'bob loomis': 1}, {'shaara': 1},

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1721940040588379
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014345884323120117
Discarted candidate: [{'ford richard': 2}, {'ford g m': 1}, {'ford richard': 1}, {'ford richard': 1}, {'ford richard': 1}, {'ford richard': 1}, {'ford richard': 1}, {'ford richard': 1}, {'ford richard': 1}]
Possible candidate: [{'ford richard': 101}]
lengthNecessary: 22.200000000000003
[{'ford richard': 101}]
['ford richard'] VS true_author: ['ford richard']
ISBN: 0679736336
true author: Ker Conway Jill
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.498276948928833
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.009099721908569336
Discarted candidate: [{'conway jill': 1, 'conway jill k': 1, 'conway jill kathryn': 1, 'conway jill kerr': 2}, {'jill ker': 1, 'k

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.1504230499267578
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.007016897201538086
Discarted candidate: [{'conant jennet': 6}, {'conant jennet richards': 2}, {'conant jennet': 1}, {'conant': 1}, {'conant jennet': 1}, {'conant jennet': 1}, {'conant jennet': 1}]
Possible candidate: [{'conant jennet': 59}]
lengthNecessary: 14.4
[{'conant jennet': 59}]
['conant jennet'] VS true_author: ['conant jennet']
ISBN: 0688040330
true author: Bush Barbara
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.49370813369750977
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.06150388717651367
Discarted candidate: [{'bush k mildred': 8}, {'drew lisa': 6}, {'bush kerr mildred': 4}, {'as barbar bush dictated millie to': 2, 'as barbara bush dictated millie to': 2}, 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.41927504539489746
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009789228439331055
Discarted candidate: [{'brown sandra': 2}, {'fleming ian': 1}, {'brown sandra': 1}, {'brown sandra': 1}, {'brown sandra': 1}, {'brown sandra': 1}, {'brown sandra': 1}, {'brown sandra': 1}]
Possible candidate: [{'brown sandra': 81}]
lengthNecessary: 18.0
[{'brown sandra': 81}]
['brown sandra'] VS true_author: ['brown sandra']
ISBN: 0743249291
true author: Gregory Philippa
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13765287399291992
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.009931802749633789
Discarted candidate: [{'gregory philippa': 2}, {'gregory': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}, {'gregory philippa': 1}, {'gregory philippa': 1

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.27372217178344727
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.026553869247436523
Discarted candidate: [{'steve stone': 3}, {'anderson brian herbert': 1}, {'j kevin steve stone': 1}, {'anderson j kevin': 1}, {'anderson j kevin': 1}, {'anderson j kevin': 1}, {'anderson j kevin': 1}, {'anderson j kevin': 1}]
Possible candidate: [{'brian herbert': 77}, {'anderson j kevin': 65}]
lengthNecessary: 30.400000000000002
[{'brian herbert': 77}, {'anderson j kevin': 65}]
['brian herbert', 'anderson j kevin'] VS true_author: ['brian herbert', 'anderson j kevin']
ISBN: 0778312518
true author: Macomber Debbie
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12135910987854004
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.008157968521118164
Discarted can

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19592499732971191
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.014837026596069336
Discarted candidate: [{'kate moloney': 19}, {'gunnkate moloney tim': 1}, {'kate maloney': 1}, {'kate maloney': 1}, {'kate maloney': 1}, {'kate maloney': 1}, {'kate maloney': 1}, {'kate maloney': 1}]
Possible candidate: [{'gunn tim': 64}, {'kate maloney': 24}]
lengthNecessary: 22.8
[{'gunn tim': 64}, {'kate maloney': 24}]
['gunn tim', 'kate maloney'] VS true_author: ['gunn tim', 'kate maloney']
ISBN: 0812517725
true author: Jordan Robert
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.5482649803161621
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.03244185447692871
Discarted candidate: [{'of professor studies theatre': 2}, {'great hunt the': 1}, {'jordan ro

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.17471599578857422
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 9
Blocking time is: 0.009540081024169922
Discarted candidate: [{'carl foreword gorman': 1, 'carl gorman': 6}, {'benis frank m': 3}, {'kanji kawano': 3}, {'k kawano': 1, 'kawano': 2}, {'benis frank intro m usmc': 1}, {'code talker': 1}, {'kawano kenji w': 1}, {'foreword-carl gorman': 1}]
Possible candidate: [{'kawano kenji': 69, 'kenji': 1}]
lengthNecessary: 18.0
[{'kawano kenji': 69, 'kenji': 1}]
['kawano kenji'] VS true_author: ['kawano kenji']
ISBN: 0874744350
true author: Fitzhugh William W.,Crowell Aron
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.3943939208984375
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.06103205680847168
Discarted candidate: [{'a arutiunov s': 1, 'dzeniskevich g i': 

embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.13111209869384766
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.006963968276977539
Discarted candidate: [{'bianchi john': 4}, {'dickinson terrence': 4}, {'dickinson terence': 1}, {'dickinson terence': 1}, {'dickinson terence': 1}, {'dickinson terence': 1}, {'dickinson terence': 1}]
Possible candidate: [{'dickinson terence': 60}]
lengthNecessary: 14.600000000000001
[{'dickinson terence': 60}]
['dickinson terence'] VS true_author: ['dickinson terence']
ISBN: 1400052580
true author: De Laurentiis Giada
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.19364213943481445
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 10
Blocking time is: 0.011727094650268555
Discarted candidate: [{'pearson victoria': 2}, {'batali mario': 2}, {'batalli mario': 2}, {'de giad laurentiis'

Blocking time is: 0.011766195297241211
Discarted candidate: [{'contributor-eddie muller': 1}, {'eddie mullier': 1}, {'huhter tab': 1}, {'hunter tab w': 1}, {'hunter tab': 1}, {'hunter tab': 1}, {'hunter tab': 1}, {'hunter tab': 1}]
Possible candidate: [{'hunter tab': 65}, {'eddie muller': 28}]
lengthNecessary: 20.200000000000003
[{'hunter tab': 65}, {'eddie muller': 28}]
['hunter tab', 'eddie muller'] VS true_author: ['hunter tab', 'eddie muller']
ISBN: 1577192761
true author: Simmons Richard
embedding_type: inferSent
attributes_list: ['author']
model_type: bilstm
char_level: False
Embedding time is: 0.12166118621826172
cluster_method: hierarchy
num_clusters_rate: 0.1
NUM_CLUSTERS 8
Blocking time is: 0.00782918930053711
Discarted candidate: [{'david icketts': 1}, {'richard simmons': 1}, {'richard simmons': 1}, {'richard simmons': 1}, {'richard simmons': 1}, {'richard simmons': 1}, {'richard simmons': 1}]
Possible candidate: [{'richard simmons': 67}]
lengthNecessary: 14.8
[{'richard sim

In [7]:
# Import the evaluation entry point explicitly rather than via a wildcard:
# the evaluation cells below call only getEvaluation, and a star import would
# hide where that name comes from and could shadow names imported earlier.
from evaluation import getEvaluation

In [13]:
# Compare finalAuthors with trueAuthors (both returned by
# launchWithoutReductionFusion in an earlier cell).
# Per the output below, the call prints precision, recall and f1Score and
# returns the same three values as a tuple (shown as the cell result).
# NOTE(review): the meaning of the third argument (1) is not visible in this
# notebook — confirm against evaluation.getEvaluation.
# NOTE(review): this cell's execution count (13) is out of sequence with its
# neighbours (7 and 8), and the identical call in the next cell reports
# different scores, so this output presumably reflects a different kernel
# state — re-run with Restart & Run All before relying on either result.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.8682295877122069
recall is 0.9597855227882037
f1Score is 0.9117147707979626


(0.8682295877122069, 0.9597855227882037, 0.9117147707979626)

In [8]:
# Same evaluation call as the previous cell: per the output below it prints
# precision, recall and f1Score and returns them as a 3-tuple.
# NOTE(review): the code is identical to the previous cell, yet the reported
# scores differ (execution counts 13 vs 8), so the two outputs presumably come
# from different runs or kernel state — keep a single evaluation cell and
# regenerate its output from a fresh kernel.
getEvaluation(finalAuthors, trueAuthors, 1)

precision is 0.9014567266495287
recall is 0.9401251117068812
f1Score is 0.9203849518810149


(0.9014567266495287, 0.9401251117068812, 0.9203849518810149)