In [1]:
import sys
sys.path.append('../src/mane/prototype/')
import numpy as np
import graph as g
import pickle as p

from sklearn.preprocessing import normalize, scale
from sklearn.metrics import f1_score
from sklearn.multiclass import OneVsRestClassifier
from sklearn.svm import LinearSVC
from sklearn.linear_model import LogisticRegression

In [65]:
def lg(exp_id, graph_name, index=(0,), norm=False, split=0.5, max_iter=100, C=1e9, ic=500,
       class_weight=None):
    """Fit a logistic-regression node classifier on saved embeddings and print F1 scores.

    Parameters
    ----------
    exp_id : str
        Experiment id; the weights are read from
        '../src/mane/prototype/embeddings/<exp_id>.weights'.
    graph_name : str
        Dataset name; '<graph_name>.graph' and '<graph_name>.community' under
        '../src/mane/data/' are handed to ``g.graph_from_pickle``.
    index : sequence of int or None
        Which entries of the unpickled weights object to average into one
        embedding matrix. ``None`` uses the unpickled object itself as the
        embedding.
    norm : bool
        If true, the embedding is passed through ``sklearn.preprocessing.normalize``.
    split : float
        Forwarded unchanged to ``graph.gen_community``
        (presumably the training fraction - TODO confirm against graph.py).
    max_iter, C : forwarded to ``LogisticRegression``.
    ic : float
        Forwarded to ``LogisticRegression`` as ``intercept_scaling``.
    class_weight : dict, 'balanced' or None
        Forwarded to ``LogisticRegression``; ``None`` keeps the previous behaviour.

    Returns
    -------
    tuple
        ``(y_true, y_pred, emb, predictor, xids, y_train, graph)``.

    Raises
    ------
    ValueError
        If ``index`` is an empty sequence.
    """
    weightfile = '../src/mane/prototype/embeddings/' + exp_id + '.weights'
    graphfile = '../src/mane/data/' + graph_name
    # NOTE(review): unpickling can execute arbitrary code - only load trusted weight files.
    with open(weightfile, 'rb') as f:
        w = p.load(f)
    graph = g.graph_from_pickle(graphfile+'.graph', graphfile+'.community')

    if index is None:
        emb = w
    else:
        index = list(index)
        if not index:
            raise ValueError('index must be None or a non-empty sequence of weight indices')
        # Average without mutating w: the former in-place accumulation aliased
        # w[index[0]], which gave a wrong mean when an index was repeated.
        emb = np.mean([w[i] for i in index], axis=0)
    if norm:
        emb = normalize(emb)

    xids, y_train = graph.gen_community(split)
    X = [emb[i] for i in xids]
    predictor = LogisticRegression(C=C, max_iter=max_iter,
                                   n_jobs=-1, intercept_scaling=ic,
                                   class_weight=class_weight).fit(X, y_train)

    # NOTE(review): scoring runs over every node of the graph; if xids are drawn
    # from graph.nodes() (presumably - TODO confirm) the training nodes are
    # included, so these are not held-out scores.
    nodes = list(graph.nodes())
    y_true = [graph._communities[i] for i in nodes]
    # One batched predict call instead of one call per node.
    y_pred = list(predictor.predict([emb[i] for i in nodes])) if nodes else []
    print('Experiment ', exp_id, ' ', graph_name)
    print('f1_macro (emb): ', f1_score(y_true, y_pred, average='macro'))
    print('f1_micro (emb): ', f1_score(y_true, y_pred, average='micro'))
    return y_true, y_pred, emb, predictor, xids, y_train, graph

In [9]:
lg_average('BC3021', 'blogcatalog3')

Experiment  BC3021   blogcatalog3
f1_macro (avg):  0.00484540632064
f1_micro (avg):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [10]:
lg_all('BC3021', 'blogcatalog3')

Experiment  BC3021   blogcatalog3
f1_macro (avg):  0.00598011775139
f1_micro (avg):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [11]:
lg_average('BC3023', 'blogcatalog3')

Experiment  BC3023   blogcatalog3
f1_macro (avg):  0.00484540632064
f1_micro (avg):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [12]:
lg_all('BC3023', 'blogcatalog3')

Experiment  BC3023   blogcatalog3
f1_macro (avg):  0.00688194384949
f1_micro (avg):  0.104053529868


  'precision', 'predicted', average, warn_for)


In [15]:
lg_embeddings('BC3023', 'blogcatalog3')

Experiment  BC3023   blogcatalog3
f1_macro (emb):  0.00484540632064
f1_micro (emb):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [14]:
lg_nce('BC3023', 'blogcatalog3')

Experiment  BC3023   blogcatalog3
f1_macro (emb):  0.0070864616913
f1_micro (emb):  0.104441427463


  'precision', 'predicted', average, warn_for)


In [20]:
for _ in range(10):
    lg_average('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.116740845038
f1_micro (avg):  0.258921644686


  'precision', 'predicted', average, warn_for)


Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.115163291441
f1_micro (avg):  0.252036462374
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.119866603526
f1_micro (avg):  0.258145849496
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.115795405431
f1_micro (avg):  0.258436772692
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.115583902707
f1_micro (avg):  0.259697439876
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.114217090023
f1_micro (avg):  0.255236617533
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.115176455722
f1_micro (avg):  0.256206361521
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.109405997054
f1_micro (avg):  0.253588052754
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.118284651023
f1_micro (avg):  0.256691233514
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.117148492359
f1_micro (avg):  0.257951900698


In [24]:
for _ in range(10):
    lg_average('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.114492865125
f1_micro (avg):  0.255527540729


  'precision', 'predicted', average, warn_for)


Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.118079182637
f1_micro (avg):  0.258242823894
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.114348160228
f1_micro (avg):  0.255527540729
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.114324856109
f1_micro (avg):  0.258242823894
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.113367693185
f1_micro (avg):  0.256303335919
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.112849965176
f1_micro (avg):  0.258339798293
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.114462702368
f1_micro (avg):  0.257660977502
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.112905631053
f1_micro (avg):  0.256691233514
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.115086471157
f1_micro (avg):  0.255721489527
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.112165410078
f1_micro (avg):  0.254751745539


In [25]:
for _ in range(10):
    lg_embeddings('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0897211308695
f1_micro (emb):  0.230217222653


  'precision', 'predicted', average, warn_for)


Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0880587371365
f1_micro (emb):  0.230799069046
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0899957295453
f1_micro (emb):  0.230605120248
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0872543169001
f1_micro (emb):  0.227986811482
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.08967709717
f1_micro (emb):  0.229829325058
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0848275240609
f1_micro (emb):  0.228568657874
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0912150848083
f1_micro (emb):  0.233320403413
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.086548012115
f1_micro (emb):  0.229926299457
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0893675469702
f1_micro (emb):  0.234968968192
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.0861642632646
f1_micro (emb):  0.227792862684


In [27]:
# Without normalize
for _ in range(10):
    lg_embeddings('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.134601815957
f1_micro (emb):  0.257467028704


  'precision', 'predicted', average, warn_for)


Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.141062522922
f1_micro (emb):  0.258339798293
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.140325718933
f1_micro (emb):  0.255139643134
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.134998919531
f1_micro (emb):  0.254751745539
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.139766097233
f1_micro (emb):  0.256691233514
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.136630917426
f1_micro (emb):  0.253297129558
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.135236987492
f1_micro (emb):  0.251842513576
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.137346870654
f1_micro (emb):  0.254266873545
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.134263648314
f1_micro (emb):  0.252618308766
Experiment  BC3003   blogcatalog3
f1_macro (emb):  0.144334557
f1_micro (emb):  0.259018619085


In [5]:
# Without normalize
for _ in range(10):
    lg_average('BC3024', 'blogcatalog3')

Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.123236708791
f1_micro (avg):  0.174941815361
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.119223817795
f1_micro (avg):  0.171353762607


  'precision', 'predicted', average, warn_for)


Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.12650246948
f1_micro (avg):  0.18046935609
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.126457555639
f1_micro (avg):  0.176784328937
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.128056499036
f1_micro (avg):  0.175620636152
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.136342409676
f1_micro (avg):  0.177075252133
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.119535319362
f1_micro (avg):  0.176493405741
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.118683102454
f1_micro (avg):  0.175523661753
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.136025498216
f1_micro (avg):  0.173487199379
Experiment  BC3024   blogcatalog3
f1_macro (avg):  0.132012225797
f1_micro (avg):  0.178529868115


In [15]:
# Test embedding from node2vec without normalize
# Loads the pickled node2vec weights, copies one row per graph node into a dense
# matrix, fits a logistic regression on the nodes returned by gen_community and
# prints macro/micro F1 over all graph nodes.

exp_id = 'BC3_node2vec'
graph_name = 'blogcatalog3'
max_iter = 1000
portition = 0.5  # (sic) value handed to graph.gen_community below
weightfile = '../src/mane/prototype/embeddings/' + exp_id + '.weights'
graphfile = '../src/mane/data/' + graph_name
# NOTE(review): unpickling can execute arbitrary code - only load trusted weight files.
with open(weightfile, 'rb') as f:
    w = p.load(f)
graph = g.graph_from_pickle(graphfile+'.graph', graphfile+'.community')
node_ids = list(graph.nodes())
# np.zeros rather than np.ndarray(shape=...): the latter returns uninitialised
# memory, so any row that is not overwritten below would contain garbage.
wl = np.zeros(shape=(10313,128), dtype=np.float32)
for i in node_ids:
    wl[i][:] = w[i]
e_norm = wl
xids, y_train = graph.gen_community(portition)
X = [e_norm[i] for i in xids]
#predictor = LogisticRegression(max_iter=max_iter, n_jobs=2).fit(X, y_train)
predictor = LogisticRegression(C=1e9, max_iter=max_iter, n_jobs=2).fit(X, y_train)
y_true = [graph._communities[i] for i in node_ids]
# One batched predict call instead of one call per node.
y_pred = list(predictor.predict(e_norm[node_ids]))
print('Experiment ', exp_id, ' ', graph_name)
print('f1_macro (avg): ', f1_score(y_true, y_pred, average='macro'))
print('f1_micro (avg): ', f1_score(y_true, y_pred, average='micro'))

Experiment  BC3_node2vec   blogcatalog3
f1_macro (avg):  0.134333035066
f1_micro (avg):  0.127133436773


In [12]:
# With high regularization restriction
for _ in range(10):
    lg_average('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.18885993527
f1_micro (avg):  0.264352211016


  'precision', 'predicted', average, warn_for)


Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.178624882281
f1_micro (avg):  0.263382467029
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.186790205747
f1_micro (avg):  0.269200930954
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.183781611367
f1_micro (avg):  0.270461598138
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.182875408714
f1_micro (avg):  0.264255236618
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.170921064814
f1_micro (avg):  0.262994569434
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.180035840937
f1_micro (avg):  0.266291698991
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.181679782199
f1_micro (avg):  0.268328161365
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.172461884888
f1_micro (avg):  0.260473235066
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.195330127801
f1_micro (avg):  0.266776570985


In [14]:
# Without high regularization restriction (maybe extreme overfit)
for _ in range(10):
    lg_average('BC3003', 'blogcatalog3')

Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.231464313831
f1_micro (avg):  0.269879751746
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.231905373246
f1_micro (avg):  0.26871605896
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.225459827678
f1_micro (avg):  0.26406128782
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.227966114565
f1_micro (avg):  0.263479441427
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.223431328045
f1_micro (avg):  0.26871605896
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.226662751553
f1_micro (avg):  0.261636927851
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.222029666086
f1_micro (avg):  0.26794026377
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.236412099949
f1_micro (avg):  0.268231186967
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.220325754334
f1_micro (avg):  0.26095810706
Experiment  BC3003   blogcatalog3
f1_macro (avg):  0.229073200321
f1_micro (avg):  0.267746314973


In [16]:
# Without high regularization
for _ in range(10):
    lg_embeddings('BC3_deepwalk', 'blogcatalog3')

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.176592490043
f1_micro (emb):  0.190942591156
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.168755210426
f1_micro (emb):  0.186675717611
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.165052734059
f1_micro (emb):  0.183669511249
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.170187811286
f1_micro (emb):  0.189584949573
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.169425552103
f1_micro (emb):  0.181536074476
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.160817582297
f1_micro (emb):  0.184639255237
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.168058670528
f1_micro (emb):  0.186772692009
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.172268980869
f1_micro (emb):  0.189487975175
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.174936647138
f1_micro (emb):  0.187257564003
Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.17518

In [18]:
# Without high regularization restriction (maybe extreme overfit)
for _ in range(10):
    lg_average('BC3012', 'blogcatalog3')

Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.230215879861
f1_micro (avg):  0.269976726144
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.240204737171
f1_micro (avg):  0.276474010861
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.237116080153
f1_micro (avg):  0.275116369279
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.229967973073
f1_micro (avg):  0.278510473235
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.227415752099
f1_micro (avg):  0.271819239721
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.231182872668
f1_micro (avg):  0.277637703646
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.235566378466
f1_micro (avg):  0.279965089216
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.234393485211
f1_micro (avg):  0.276667959659
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.23043577756
f1_micro (avg):  0.27889837083
Experiment  BC3012   blogcatalog3
f1_macro (avg):  0.236381520751
f1_micro (avg):  0.276183087665


In [12]:
# Normalization might increase the F1 score by ~1.5%
_ = lg('BC3_node2vec', 'blogcatalog3', None, True, C=1e10)

Experiment  BC3_node2vec   blogcatalog3
f1_macro (emb):  0.142211558894
f1_micro (emb):  0.138673390225


In [8]:
# C plays a big role in f1 score, bigger C is better (more overfit)
_ = lg('BC3_node2vec', 'blogcatalog3', None, C=1e10)

Experiment  BC3_node2vec   blogcatalog3
f1_macro (emb):  0.136424362427
f1_micro (emb):  0.127424359969


In [7]:
# C plays a big role in the F1 score: a larger C is better (more overfit) but takes longer to fit.
_ = lg('BC3_node2vec', 'blogcatalog3', None, C=1e15)

Experiment  BC3_node2vec   blogcatalog3
f1_macro (emb):  0.139981239597
f1_micro (emb):  0.12577579519


In [59]:
# Increase ic for node2vec too, but no significant improvement.
_ = lg('BC3_node2vec', 'blogcatalog3', None, C=1e15, ic=20)

Experiment  BC3_node2vec   blogcatalog3
f1_macro (emb):  0.132168967917
f1_micro (emb):  0.12810318076


In [17]:
_ = lg('BC3_deepwalk', 'blogcatalog3')

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.159558442833
f1_micro (emb):  0.184154383243


In [18]:
_ = lg('BC3_deepwalk', 'blogcatalog3', C=1e10)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.173899261504
f1_micro (emb):  0.187257564003


In [19]:
_ = lg('BC3_deepwalk', 'blogcatalog3', C=1e15)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.178525504103
f1_micro (emb):  0.188712179984


In [20]:
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e15)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.179359606732
f1_micro (emb):  0.185512024825


In [21]:
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e20)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.173694083412
f1_micro (emb):  0.185512024825


In [23]:
# Test increase intercept scaling (less regularization) = 1e10
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=1e10)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.00484540632064
f1_micro (emb):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [25]:
# Test increase intercept scaling (less regularization) = 1e5
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=1e5)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.00484540632064
f1_micro (emb):  0.104344453064


  'precision', 'predicted', average, warn_for)


In [27]:
# Test increase intercept scaling (less regularization) = 1
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=1)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.179533339032
f1_micro (emb):  0.184736229635


In [29]:
# Test increase intercept scaling (less regularization) = 0.1
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=0.1)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.168065879964
f1_micro (emb):  0.18357253685


In [31]:
# Test increase intercept scaling (less regularization) = 5
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=5)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.180549583389
f1_micro (emb):  0.182311869666


In [33]:
# Test increase intercept scaling (less regularization) = 100
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=100)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.183072014513
f1_micro (emb):  0.190166795966


In [35]:
# Test increase intercept scaling (less regularization) = 1000
# ic is passed explicitly so the call matches the value stated above.
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=1000)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.16228669375
f1_micro (emb):  0.170868890613


  'precision', 'predicted', average, warn_for)


In [37]:
# Test increase intercept scaling (less regularization) = 500
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=500)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.182358768162
f1_micro (emb):  0.183184639255


In [38]:
# Test increase intercept scaling (less regularization) = 200
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=200)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.19052928339
f1_micro (emb):  0.188906128782


In [39]:
# Test increase intercept scaling (less regularization) = 300
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=300)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.178623753489
f1_micro (emb):  0.185415050427


In [40]:
# Test increase intercept scaling (less regularization) = 250
_ = lg('BC3_deepwalk', 'blogcatalog3', norm=True, C=1e10, ic=250)

Experiment  BC3_deepwalk   blogcatalog3
f1_macro (emb):  0.186272138262
f1_micro (emb):  0.18589992242


In [41]:
# Test increase intercept scaling (less regularization) = 200
_ = lg('BC3012', 'blogcatalog3', norm=True, C=1e10, ic=200)

Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.209849459982
f1_micro (emb):  0.239429790535


In [42]:
# Test increase intercept scaling (less regularization) = 200
_ = lg('BC3012', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=200)

Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.232876907793
f1_micro (emb):  0.27812257564


In [44]:
# Test increase intercept scaling (less regularization) = 220
_ = lg('BC3012', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=220)

Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.233082461595
f1_micro (emb):  0.27967416602


In [46]:
# Note: This is still random walk
_ = lg('BC3025', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=220)

Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.246718317201
f1_micro (emb):  0.282971295578


In [47]:
# Check the result of experiment 24, which uses a much smaller num_walk than experiment 25
_ = lg('BC3024', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=220)

Experiment  BC3024   blogcatalog3
f1_macro (emb):  0.165170496715
f1_micro (emb):  0.175426687355


In [61]:
for _ in range(10):
    lg('BC3025', 'blogcatalog3', index=[0,1], norm=True, C=1e15, ic=230)

Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.231367291946
f1_micro (emb):  0.274049650892
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.240162489034
f1_micro (emb):  0.279480217223
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.234634939919
f1_micro (emb):  0.276280062064
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.257472767209
f1_micro (emb):  0.286462373933
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.243036177004
f1_micro (emb):  0.278219550039
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.250303983259
f1_micro (emb):  0.283359193173
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.24255831965
f1_micro (emb):  0.279286268425
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.242226100945
f1_micro (emb):  0.281710628394
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.246300652772
f1_micro (emb):  0.284522885958
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.241641796936
f1_micro (emb):  0.281322730799


In [63]:
# Test if balancing the class weight will give better results - Nope!
# NOTE(review): this call passes no class-weight setting and is textually identical
# to the earlier BC3025 run, so balancing was presumably enabled by editing lg()
# before executing this cell - TODO confirm. Re-running the cell as written is not
# expected to reproduce the scores recorded below.
for _ in range(10):
    lg('BC3025', 'blogcatalog3', index=[0,1], norm=True, C=1e15, ic=230)

Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.224380957857
f1_micro (emb):  0.23283553142
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.223271052248
f1_micro (emb):  0.231380915438
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.221421182605
f1_micro (emb):  0.229538401862
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.223983957479
f1_micro (emb):  0.232156710628
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.230403768585
f1_micro (emb):  0.232738557021
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.22186299814
f1_micro (emb):  0.227986811482
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.215577851566
f1_micro (emb):  0.227114041893
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.21914005075
f1_micro (emb):  0.227889837083
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.229582394109
f1_micro (emb):  0.234775019395
Experiment  BC3025   blogcatalog3
f1_macro (emb):  0.222870394891
f1_micro (emb):  0.228083785881


In [64]:
# Test if balancing the class weight will give better results - Nope!
# NOTE: BC3012 is motif walk
# NOTE(review): this call passes no class-weight setting, so balancing was presumably
# enabled by editing lg() before executing this cell - TODO confirm. Re-running the
# cell as written is not expected to reproduce the scores recorded below.
for _ in range(10):
    lg('BC3012', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=230)

Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.214191739416
f1_micro (emb):  0.22498060512
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.22357130585
f1_micro (emb):  0.228083785881
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.218972529614
f1_micro (emb):  0.225853374709
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.224612124085
f1_micro (emb):  0.231380915438
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.21616459147
f1_micro (emb):  0.227211016292
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.215718913787
f1_micro (emb):  0.227695888285
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.210375258756
f1_micro (emb):  0.219743987587
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.214906468457
f1_micro (emb):  0.224495733126
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.212082320573
f1_micro (emb):  0.228471683476
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.220601710571
f1_micro (emb):  0.232253685027


In [None]:
for _ in range(10):
    lg('BC3012', 'blogcatalog3', index=[0,1], norm=True, C=1e10, ic=230)

Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.238939110385
f1_micro (emb):  0.277249806051
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.243341618848
f1_micro (emb):  0.27812257564
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.238332321528
f1_micro (emb):  0.278801396431
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.235606345264
f1_micro (emb):  0.276474010861
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.23754928472
f1_micro (emb):  0.275504266874
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.235305996745
f1_micro (emb):  0.277152831652
Experiment  BC3012   blogcatalog3
f1_macro (emb):  0.233681557652
f1_micro (emb):  0.278704422033
