In [29]:
import pandas as pd
import json
import LLDA.model.labeled_lda as llda
import numpy as np
from sklearn.metrics import pairwise_distances
from scipy.spatial.distance import jensenshannon

In [54]:
with open('dim_sample.json') as f:
    all_data = json.load(f)

def get_unique_dis(data):
    disciplines = set()
    for pro_id in data.keys():
        disciplines.update(data[pro_id]['disciplines'])
    return disciplines

In [55]:
split = 180
train_data = {k: all_data[k] for k in list(all_data.keys())[:split]}
test_data = {k: all_data[k] for k in list(all_data.keys())[split:]}

train_project_data = {}
train_pub_data = []
for pro_id in train_data.keys():
    train_project_data[pro_id] = (train_data[pro_id]['title'], train_data[pro_id]['disciplines'])
    for pub_id in train_data[pro_id]['publications'].keys():
        train_pub_data.append((pub_id, train_data[pro_id]['publications'][pub_id]['title'], train_data[pro_id]['publications'][pub_id]['disciplines']))

test_project_data = {}
test_pub_data = []
for pro_id in test_data.keys():
    test_project_data[pro_id] = (test_data[pro_id]['title'], test_data[pro_id]['disciplines'])
    for pub_id in test_data[pro_id]['publications'].keys():
        test_pub_data.append((pub_id, test_data[pro_id]['publications'][pub_id]['title'], test_data[pro_id]['publications'][pub_id]['disciplines']))

print(len(train_project_data), len(train_pub_data))
print(len(test_project_data), len(test_pub_data))
print(len(get_unique_dis(train_data)), len(get_unique_dis({pub[0]: {'disciplines': pub[2]} for pub in train_pub_data})))

180 506
45 129
170 170


In [56]:
print(train_project_data[list(train_project_data.keys())[0]])
print(train_pub_data[0][1:])

('Quantifying trophic niches to measure the resilience of marine predators', ['4101', '4104', '3103'])
('Towards unlocking the trophic roles of rarely encountered squid: Opportunistic samples of Taningia danae and a Chiroteuthis aff. veranii reveal that the Southern Ocean top predators are nutrient links connecting deep-sea and shelf-slope environments', ['3103'])


In [57]:
# # load from disk
# llda_model_project = llda.LldaModel()
# llda_model_project.load_model_from_dir("LLDA/data_models/pro_abstracts_disciplines", load_derivative_properties=False)
# print("llda_model_project", llda_model_project)
# # print("Top-5 terms of topic 'virus': ", llda_model_project.top_terms_of_topic("virus", 5, False))
# print("Doc-Topic Matrix: \n", llda_model_project.theta)
# print("Topic-Term Matrix: \n", llda_model_project.beta)

In [58]:
llda_model_project = llda.LldaModel(labeled_documents=train_project_data.values())
print(llda_model_project)
llda_model_pub = llda.LldaModel(labeled_documents=[(pub[1], pub[2]) for pub in train_pub_data])
print(llda_model_pub)


Labeled-LDA Model:
	K = 171
	M = 180
	T = 1251
	WN = 2120
	LN = 281
	alpha = 0.29239766081871343
	eta = 0.001
	perplexity = 90.39256989643876
	

Labeled-LDA Model:
	K = 171
	M = 506
	T = 2987
	WN = 6374
	LN = 704
	alpha = 0.29239766081871343
	eta = 0.001
	perplexity = 201.0754566827323
	


In [59]:
# training
llda_model_project.training(iteration=10, log=True)
# while True:
#     print("iteration %s sampling..." % (llda_model.iteration + 1))
#     llda_model.training(1)
#     print("after iteration: %s, perplexity: %s" % (llda_model.iteration, llda_model.perplexity()))
#     print("delta beta: %s" % llda_model.delta_beta)
#     if llda_model.is_convergent(method="beta", delta=0.01):
#         break

after iteration: 0, perplexity: 90.39256989643876
gibbs sample count:  2120
after iteration: 1, perplexity: 39.92193920191872
gibbs sample count:  2120
after iteration: 2, perplexity: 36.904367522287714
gibbs sample count:  2120
after iteration: 3, perplexity: 36.22049551723303
gibbs sample count:  2120
after iteration: 4, perplexity: 35.19380352978232
gibbs sample count:  2120
after iteration: 5, perplexity: 35.30325445294307
gibbs sample count:  2120
after iteration: 6, perplexity: 34.10990889632067
gibbs sample count:  2120
after iteration: 7, perplexity: 34.212801494744745
gibbs sample count:  2120
after iteration: 8, perplexity: 33.5082742852733
gibbs sample count:  2120
after iteration: 9, perplexity: 33.429986347868635
gibbs sample count:  2120


In [60]:
llda_model_pub.training(iteration=10, log=True)

after iteration: 0, perplexity: 201.0754566827323
gibbs sample count:  6374
after iteration: 1, perplexity: 113.08582653475284
gibbs sample count:  6374
after iteration: 2, perplexity: 105.78100432659338
gibbs sample count:  6374
after iteration: 3, perplexity: 103.6696121806826
gibbs sample count:  6374
after iteration: 4, perplexity: 100.81403605884597
gibbs sample count:  6374
after iteration: 5, perplexity: 99.40253019969909
gibbs sample count:  6374
after iteration: 6, perplexity: 98.51498221680718
gibbs sample count:  6374
after iteration: 7, perplexity: 97.83194282569912
gibbs sample count:  6374
after iteration: 8, perplexity: 96.60624813930383
gibbs sample count:  6374
after iteration: 9, perplexity: 95.10814504066211
gibbs sample count:  6374


In [61]:
# # update
# print("before updating: ", llda_model)
# update_labeled_documents = [("new example test example test example test example test", ["example", "test"])]
# llda_model.update(labeled_documents=update_labeled_documents)
# print("after updating: ", llda_model)

# # train again
# # llda_model.training(iteration=10, log=True)
# while True:
#     print("iteration %s sampling..." % (llda_model.iteration + 1))
#     llda_model.training(1)
#     print("after iteration: %s, perplexity: %s" % (llda_model.iteration, llda_model.perplexity()))
#     print("delta beta: %s" % llda_model.delta_beta)
#     if llda_model.is_convergent(method="beta", delta=0.01):
#         break

In [62]:
# inference
# note: the result topics may be different for difference training, because gibbs sampling is a random algorithm
document = list(test_project_data.values())[0][0]
print(document)

topics = llda_model_project.inference(document=document, iteration=30, times=10)
# print sorted topics
sorted(topics, key=lambda x: x[0])

Center of Excellence in Complex Disease Genetics-from Discovery to Precision Medicine


[('3001', 0.005414771496642827),
 ('3002', 0.005414771496642827),
 ('3003', 0.005414771496642827),
 ('3004', 0.005414771496642827),
 ('3005', 0.005414771496642827),
 ('3006', 0.012822178904050215),
 ('3007', 0.005414771496642827),
 ('3008', 0.005414771496642827),
 ('3009', 0.005414771496642827),
 ('3101', 0.005414771496642827),
 ('3102', 0.005414771496642827),
 ('3103', 0.005414771496642827),
 ('3104', 0.005414771496642827),
 ('3105', 0.005414771496642827),
 ('3106', 0.005414771496642827),
 ('3107', 0.005414771496642827),
 ('3108', 0.005414771496642827),
 ('3109', 0.005414771496642827),
 ('3201', 0.005414771496642827),
 ('3202', 0.005414771496642827),
 ('3203', 0.005414771496642827),
 ('3204', 0.005414771496642827),
 ('3205', 0.005414771496642827),
 ('3206', 0.005414771496642827),
 ('3207', 0.005414771496642827),
 ('3208', 0.005414771496642827),
 ('3209', 0.005414771496642827),
 ('3210', 0.005414771496642827),
 ('3211', 0.005414771496642827),
 ('3212', 0.007266623348494674),
 ('3213', 

In [63]:
documents = list(test_project_data.values())
project_matrix_test = np.zeros((len(documents), llda_model_project.K))

for i, (document, _) in enumerate(documents):
    topics = llda_model_project.inference(document=document, iteration=100, times=10)
    sorted_topics = sorted(topics, key=lambda x: x[0])
    for j, (topic, prob) in enumerate(sorted_topics):
        project_matrix_test[i, j] = prob

project_matrix_test

array([[0.00541477, 0.00541477, 0.00541477, ..., 0.00541477, 0.00541477,
        0.05726662],
       [0.00551694, 0.00551694, 0.00551694, ..., 0.00551694, 0.00551694,
        0.04136599],
       [0.00562303, 0.00562303, 0.00562303, ..., 0.00562303, 0.00562303,
        0.03062303],
       ...,
       [0.00541477, 0.00541477, 0.00541477, ..., 0.00541477, 0.00541477,
        0.04985922],
       [0.00551694, 0.00551694, 0.00551694, ..., 0.00551694, 0.00551694,
        0.04702637],
       [0.00562303, 0.00562303, 0.00562303, ..., 0.00562303, 0.00562303,
        0.02100765]])

In [64]:
documents = [(pub[1], pub[2]) for pub in test_pub_data]
pub_matrix_test = np.zeros((len(documents), llda_model_pub.K))

for i, (document, _) in enumerate(documents):
    topics = llda_model_pub.inference(document=document, iteration=100, times=10)
    sorted_topics = sorted(topics, key=lambda x: x[0])
    for j, (topic, prob) in enumerate(sorted_topics):
        pub_matrix_test[i, j] = prob

pub_matrix_test

array([[0.00471609, 0.00471609, 0.00471609, ..., 0.00471609, 0.00471609,
        0.05471609],
       [0.0071345 , 0.00531632, 0.00531632, ..., 0.00531632, 0.00531632,
        0.0071345 ],
       [0.00495589, 0.00495589, 0.00495589, ..., 0.00495589, 0.00495589,
        0.01851521],
       ...,
       [0.00487329, 0.00487329, 0.00487329, ..., 0.00487329, 0.00487329,
        0.02487329],
       [0.00643275, 0.0047934 , 0.0047934 , ..., 0.0047934 , 0.0047934 ,
        0.02282619],
       [0.00464123, 0.00622853, 0.00464123, ..., 0.00464123, 0.00464123,
        0.02368885]])

In [65]:
project_matrix = np.concatenate((llda_model_project.theta, project_matrix_test))
pub_matrix = np.concatenate((llda_model_pub.theta, pub_matrix_test))

distance_matrix = np.zeros((len(project_matrix), len(pub_matrix)))

for i in range(len(project_matrix)):
    for j in range(len(pub_matrix)):
        distance_matrix[i, j] = jensenshannon(project_matrix[i], pub_matrix[j])

In [68]:
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
# create a dataframe with row indices as project ids and column indices as publication ids
# if publication is in project, then 1, else 0
# if publication date is before project start date, then 0, else 1
# ratio of intersection of organisations from project and publication to organisations from publication
# ratio of intersection of authors from project and publication to authors from publication

all_data = {**train_data, **test_data}
pub_data = []
for pro_id in all_data.keys():
    for pub_id in all_data[pro_id]['publications'].keys():
        pub_data.append((pub_id, all_data[pro_id]['publications'][pub_id]))

data_matrix = [[0.] * len(pub_data) for _ in range(len(all_data))]
for i, pro_id in enumerate(all_data.keys()):
    for j, pub_id in enumerate([pub[0] for pub in pub_data]):
        belongs = 1 if pub_id in all_data[pro_id]['publications'].keys() else 0
        distance = distance_matrix[i, j]
        data_matrix[i][j] = [belongs, distance]

df = pd.DataFrame(distance_matrix, index=all_data.keys(), columns=[pub[0] for pub in pub_data])
df.to_csv('distance_dim_title.csv')
df.head()

Unnamed: 0,10.3389/fmars.2023.1254461,10.1007/978-3-031-49133-7_8,10.1007/978-3-031-43619-2_15,10.1080/11663081.2023.2246863,10.1177/03057356231165327,10.1016/j.jconrel.2024.05.037,10.1007/s13346-024-01618-6,10.1002/smll.202303682,10.1371/journal.pone.0298895,10.1007/s00334-024-00992-y,10.1038/s41598-023-44445-4,10.1101/2023.09.15.557939,10.1016/j.jasrep.2023.104204,10.1016/j.palaeo.2023.111655,10.1007/jhep05(2024)154,10.1140/epjc/s10052-024-12711-y,10.1140/epjc/s10052-024-12416-2,10.1140/epjc/s10052-024-12415-3,10.1007/jhep02(2024)124,10.1007/jhep11(2023)103,10.1007/jhep06(2023)086,10.1093/iob/obad026,10.1007/s00359-023-01629-7,10.1101/2023.03.11.531676,10.1093/mnras/stae997,10.1093/mnras/stae616,10.1051/0004-6361/202348958,10.1093/mnras/stad3163,10.1093/mnras/stad2183,10.1101/2024.01.14.574481,10.1007/s40313-024-01095-9,10.1109/tpwrs.2023.3321700,10.1109/tits.2024.3392914,10.1007/978-981-97-0989-2_24,10.1109/tsc.2023.3332701,10.1007/978-3-031-48424-7_15,10.1007/978-3-031-48424-7_13,10.1145/3631353,10.1145/3629517,10.1109/icdcs57875.2023.00111,10.1109/icws60048.2023.00056,10.1109/icws60048.2023.00031,10.1109/icws60048.2023.00068,10.1109/tsc.2023.3307143,10.1145/3600232,10.1109/mic.2023.3267266,10.1109/tsc.2023.3241975,10.1109/tmc.2022.3230856,10.1007/978-3-031-20984-0_9,10.1109/tsc.2022.3160469,10.3389/fneur.2023.1182561,10.1038/s41598-024-57498-w,10.1016/j.jmrt.2023.11.014,10.1016/j.jmst.2023.05.020,10.1016/j.fuel.2023.130187,10.1017/9781009297349,10.1007/s11229-023-04282-4,10.3390/rel14060758,10.1002/smsc.202400096,10.1016/j.actpsy.2024.104252,10.1080/02691728.2024.2326828,10.5964/ejop.12031,10.1111/jopy.12805,10.1109/lsp.2023.3277792,10.21203/rs.3.rs-3644422/v1,10.1016/j.renene.2024.120101,10.1093/rheumatology/kead301,10.1097/mlr.0000000000002000,10.1111/tmi.13827,10.1063/5.0167167,10.1021/acsami.2c19376,10.1021/acsanm.2c05047,10.1101/2024.05.21.595254,10.1038/s41467-024-47964-4,10.1093/jb/mvae021,10.1016/j.neuron.2024.01.014,10.1016/j.isci.2023.107385,10.1016/j.peptides.2023.171051,10.3389/fphar.2023.1138666,10.3389/fphar.2023.1098976,10.1186/s43058-023-00521-4,10.1177/26334895231199467,10.1002/adom.202303199,10.1002/adom.202301232,10.1016/j.energy.2024.130322,10.1126/sciimmunol.abo4365,10.1515/sem-2023-0178,10.1364/boe.506664,10.1364/boe.494585,10.3847/1538-4357/ac4601,10.1371/journal.pone.0284416,10.1080/07350015.2023.2271039,10.1093/mnras/stae385,10.1093/mnras/stad2760,10.1002/ange.202320045,10.1002/anie.202320045,10.1016/j.chembiol.2024.02.012,10.1101/2023.11.29.569293,10.1038/s41467-023-41197-7,10.35772/ghm.2023.01065,10.3390/v15040896,10.1111/dar.13836,10.1063/5.0153862,10.1109/imoc57131.2023.10379741,10.1109/imoc57131.2023.10379729,10.1109/access.2023.3339563,10.1109/ojpel.2023.3339014,10.1109/csci58124.2022.00203,10.1016/j.ssci.2022.105967,10.1007/978-3-031-06015-1_8,10.1101/2023.01.19.524726,10.1007/s00382-023-07058-1,10.1002/oa.3284,10.1136/bmjopen-2023-080603,10.1101/2023.08.02.551649,10.1099/mgen.0.000965,10.2140/ant.2022.16.2005,10.1103/physrevlett.132.103402,10.21468/scipostphys.15.2.068,10.1080/02606755.2023.2213550,10.3390/rs15204928,10.1063/5.0203603,10.1103/physrevapplied.21.054027,10.1109/icecom58258.2023.10367924,10.1109/icecom58258.2023.10367934,10.1109/icecom58258.2023.10367938,10.1109/icecom58258.2023.10367923,10.1109/metamaterials58257.2023.10289546,10.23919/ursigass57860.2023.10265525,10.1109/elmar59410.2023.10253914,10.1002/pen.26771,10.1016/j.canep.2023.102451,10.3390/biomedicines11051344,10.3390/pharmaceutics15010181,10.1037/fam0001189,10.3390/su15129371,10.1038/s44221-024-00208-7,10.1093/evolut/qpae036,10.1093/evolut/qpae024,10.3390/micro4010008,10.3390/molecules28196822,10.1007/s11673-023-10285-0,10.1021/acsnano.3c09776,10.1101/2023.09.08.556607,10.1016/j.snb.2023.133733,10.1016/j.ocecoaman.2023.106961,10.1016/j.tre.2023.103169,10.1016/j.elerap.2023.101336,10.1590/0001-3765202320230351,10.1590/s1678-3921.pab2023.v58.03246,10.1038/s41598-024-56540-1,10.1364/ol.494369,10.1017/s0963180124000112,10.1136/jme-2023-109568,10.1111/japp.12655,10.1038/s41539-023-00170-1,10.1016/j.neubiorev.2023.105153,10.1007/s00158-023-03663-0,10.3390/ma16145076,10.1007/978-3-031-55260-1_15,10.1007/s11228-024-00719-1,10.1007/s00205-023-01948-8,10.1142/s0219199723500657,10.1007/s12220-023-01484-7,10.1007/s10957-023-02344-8,10.1007/978-3-031-46359-4_2,10.1007/s10208-023-09629-4,10.1007/s00245-023-10029-x,10.1007/s00028-023-00902-1,10.1016/j.jde.2023.06.004,10.1007/s00030-023-00857-9,10.1007/s11579-023-00333-z,10.1061/jmenea.meeng-5794,10.1177/21695067231194338,10.1038/s41597-024-03034-4,10.1039/d3ew00347g,10.1101/2024.05.17.24307550,10.1101/2024.01.09.24301073,10.1038/s41598-023-41853-4,10.1111/sjos.12685,10.1038/s41593-023-01321-8,10.1016/j.jclinepi.2023.02.020,10.1371/journal.pone.0280192,10.1016/j.jbi.2022.104243,10.1016/j.eclinm.2022.101724,10.38107/037,10.1002/adfm.202314696,10.1063/5.0168129,10.1103/physrevmaterials.7.064202,10.1038/s41699-023-00404-1,10.1061/jsendh.steng-12655,10.1186/s40623-023-01940-2,10.1029/2022ja031231,10.1029/2023ja031663,10.1029/2022gl101465,10.21203/rs.3.rs-4345687/v1,10.1093/toxsci/kfae021,10.1101/2023.08.28.555101,10.1103/physrevb.109.205125,10.1111/cgf.14942,10.1109/tpami.2022.3163720,10.1016/j.csl.2024.101623,10.1039/d0sc01737j,10.1186/s12889-023-17570-y,10.1080/13218719.2023.2243303,10.5694/mja2.52089,10.1177/00938548231170799,10.1007/s11150-024-09710-z,10.1016/j.jbankfin.2023.107047,10.1016/j.euroecorev.2023.104632,10.1038/s41598-023-30724-7,10.1038/s41598-023-29536-6,10.1111/obes.12545,10.1016/j.jebo.2022.11.027,10.3389/fimmu.2023.1060258,10.1016/j.jhydrol.2024.130983,10.1101/2024.03.18.585583,10.1016/j.celrep.2024.113675,10.1103/physrevx.14.021017,10.1038/s41559-024-02331-w,10.1016/j.gloplacha.2024.104354,10.1038/s41467-023-41685-w,10.1126/sciadv.adg7679,10.1144/sp532-2022-1,10.1523/jneurosci.0226-23.2023,10.1101/2023.01.11.523491,10.1073/pnas.2309379120,10.1073/pnas.2301947120,10.1038/s41467-024-48673-8,10.1038/s41467-024-47953-7,10.1016/j.fsigen.2024.103048,10.1093/bib/bbad163,10.1101/2023.12.12.570420,10.1016/j.celrep.2023.113331,10.1103/physrevd.108.105013,10.1007/jhep11(2023)005,10.1101/2024.01.29.574039,10.1126/scitranslmed.adi9711,10.3390/cancers15143723,10.1021/acsnano.3c11337,10.1038/s41467-023-36133-8,10.1016/j.cobme.2024.100547,10.1002/ange.202319567,10.1002/anie.202319567,10.1016/j.jfca.2023.105901,10.1016/j.foodcont.2023.109969,10.1016/j.respol.2024.104954,10.1371/journal.pbio.3002513,10.1109/qce57702.2023.00111,10.1109/iccad57390.2023.10323863,10.1016/j.ic.2023.105077,10.1145/3582016.3582039,10.1109/tcad.2022.3179223,10.1145/3517145,10.1016/j.tcs.2022.02.017,10.1145/3514355,10.1145/3514239,10.1038/s41598-024-51799-w,10.3390/cells12242815,10.5771/9783748935544,10.1016/j.eswa.2024.124100,10.1016/j.frl.2024.105308,10.12688/openreseurope.16436.1,10.12688/openreseurope.16278.1,10.12688/openreseurope.15386.1,10.3390/foods12244484,10.1057/s42984-024-00090-3,10.1002/anie.202315985,10.1002/ange.202315985,10.1161/atvbaha.123.319821,10.1093/cvr/cvad149,10.1161/strokeaha.123.042714,10.1016/j.jtha.2023.04.002,10.1182/bloodadvances.2023010100,10.3389/fphar.2024.1379236,10.1101/2023.07.03.547532,10.1103/physreve.107.l052602,10.1063/5.0133871,10.1109/icnwc57852.2023.10127328,10.1016/j.atech.2023.100265,10.1016/j.cct.2023.107387,10.1155/2023/2397564,10.1007/s10502-024-09441-1,10.1111/gcb.16637,10.3390/ma16051978,10.21203/rs.3.rs-4271873/v1,10.1038/s41419-024-06693-8,10.1038/s41598-024-56928-z,10.1016/j.chemgeo.2024.122157,10.1016/j.chemgeo.2022.121064,10.2343/geochemj.gj22004,10.1016/j.jwpe.2023.104395,10.1016/j.jece.2023.111107,10.1080/02614367.2022.2162109,10.1109/twc.2024.3400601,10.1109/globecom54140.2023.10437972,10.1109/twc.2023.3344802,10.1109/tifs.2023.3268443,10.1093/ptep/ptae021,10.1021/accountsmr.4c00071,10.26434/chemrxiv-2024-hvxml,10.1039/d4nr01024h,10.1038/s42004-024-01143-0,10.1039/d3dd00236e,10.1039/d3tc03606e,10.1021/acs.chemmater.3c01744,10.1021/acs.inorgchem.3c02337,10.1063/5.0144827,10.1002/anie.202314378,10.1002/ange.202314378,10.1039/d3ta04707e,10.1039/d3ce00881a,10.1002/asia.202300673,10.1038/s41467-023-38737-6,10.26434/chemrxiv-2023-d1s8w,10.1002/adma.202211478,10.1145/3589334.3645329,10.1029/2023gl104396,10.20396/cel.v65i00.8673331,10.1016/j.procs.2023.08.230,10.1371/journal.pbio.3001984,10.1101/2022.04.22.489138,10.1002/brb3.3490,10.1016/j.clinph.2024.04.002,10.1111/ejn.16001,10.3389/fneur.2023.1177589,10.1016/j.clinph.2022.08.015,10.1101/2024.05.23.24307833,10.1093/ofid/ofad655,10.1093/ofid/ofae018,10.1371/journal.pone.0297775,10.21203/rs.3.rs-2640564/v3,10.1002/saj2.20688,10.1071/sr23164,10.1029/2023gl104852,10.1038/s41598-022-10957-8,10.1186/s40623-022-01584-8,10.1111/nph.19336,10.3389/fpsyg.2022.1014713,10.3390/v15102029,10.3389/fnut.2023.1215768,10.3390/educsci13080838,10.12688/routledgeopenres.17798.2,10.12688/routledgeopenres.17798.1,10.1080/00031305.2023.2232006,10.1080/0969725x.2023.2270357,10.1177/00345237231183343,10.1016/j.ijheatmasstransfer.2023.124665,10.1039/d3qm01106b,10.1016/j.mechmachtheory.2023.105508,10.1016/j.scib.2024.02.010,10.1088/1674-4527/ace179,10.1126/science.abl7759,10.1016/j.scitotenv.2024.172840,10.1016/j.envint.2024.108601,10.1016/j.envint.2024.108454,10.1016/j.envint.2023.108375,10.1016/j.envres.2023.117611,10.1016/j.envres.2023.117832,10.2337/dc23-0327,10.1021/acs.est.3c02765,10.1021/acs.est.3c00848,10.1007/s40726-023-00269-4,10.1021/acs.analchem.3c00376,10.1289/ehp11372,10.1101/2023.02.09.527886,10.3390/make6020035,10.1016/j.micromeso.2024.113042,10.3390/make6010014,10.1016/j.compag.2024.108650,10.1038/s41598-023-34320-7,10.1016/j.compag.2022.107325,10.1145/3615894.3628507,10.1016/j.scs.2023.104435,10.1093/jipm/pmac028,10.1145/3651171,10.1016/j.clsr.2024.105934,10.1145/3594739.3605113,10.1093/lambio/ovae041,10.1007/s12155-024-10734-7,10.1016/j.carres.2024.109068,10.1007/s00253-023-12908-3,10.1007/s00289-024-05152-w,10.3390/polysaccharides4020013,10.3389/fagro.2023.1148969,10.1038/s41586-024-07473-2,10.1101/2023.11.30.569198,10.1186/s13015-024-00254-6,10.1007/978-1-0716-3989-4_3,10.4230/lipics.wabi.2023.17,10.1186/s13015-024-00261-7,10.1101/2023.11.22.568259,10.1093/gbe/evad205,10.1101/gr.277679.123,10.1101/2023.06.21.545862,10.1145/3571723,10.1101/2023.05.12.540616,10.1101/2023.03.02.530874,10.1101/2023.01.30.526175,10.1101/2022.12.23.521809,10.1038/s41390-023-02992-6,10.1001/jama.2023.20358,10.1542/hpeds.2023-007246,10.1016/j.jpeds.2023.113499,10.1093/jamia/ocad053,10.1093/jamia/ocac251,10.1038/s41598-024-54655-z,10.1172/jci175031,10.3389/fgene.2023.1304425,10.1186/s13578-023-01102-7,10.1016/j.gendis.2022.11.003,10.1002/mp.16880,10.1002/mp.16352,10.1016/j.scitotenv.2022.158267,10.1016/j.foreco.2022.120301,10.1016/j.ecolind.2022.109004,10.1073/pnas.2318333121,10.1063/5.0158930,10.1145/3588432.3591521,10.1063/5.0142166,10.1038/s41467-024-46494-3,10.1128/mbio.02479-23,10.1101/2023.09.08.556855,10.1101/2023.08.31.555785,10.1186/s40168-022-01378-w,10.1101/2023.12.18.572279,10.1093/nar/gkad1164,10.1101/2023.12.03.569795,10.1101/2023.07.26.550759,10.1186/s12864-023-09265-w,10.1021/acsanm.3c05701,10.1016/j.apsusc.2023.158316,10.1080/03057240.2024.2333577,10.3390/rel14121517,10.3390/rel14111427,10.1109/icops45740.2023.10480948,10.1109/icops45740.2023.10481052,10.1109/icops45740.2023.10481130,10.1038/s41598-024-51298-y,10.1109/ppc47928.2023.10311041,10.1109/ppc47928.2023.10310918,10.1049/hve2.12382,10.21203/rs.3.rs-3143506/v1,10.4271/03-16-08-0061,10.1080/02560046.2024.2316302,10.1177/01634437231219141,10.1177/16094069231182015,10.1177/00113921231182182,10.1002/cjce.25286,10.1080/07373937.2024.2318437,10.1016/j.etap.2024.104382,10.1080/19440049.2023.2283769,10.3390/ani13152499,10.1016/j.jet.2024.105798,10.1038/s41467-023-41107-x,10.1016/j.oneear.2023.05.006,10.1088/1748-9326/acd5e8,10.1088/1748-9326/aca815,10.1145/3617232.3624856,10.1109/cloudcom59040.2023.00047,10.1007/s11761-024-00391-1,10.1109/percomworkshops56833.2023.10150370,10.1016/j.comcom.2023.04.027,10.1109/apsec57359.2022.00034,10.1109/cloudcom55334.2022.00016,10.1371/journal.pone.0285434,10.1186/s13578-023-01012-8,10.1161/strokeaha.122.041651,10.1080/15534510.2023.2279662,10.1111/nana.12994,10.1080/14680777.2023.2258298,10.1038/s41598-023-35252-y,10.1177/10596011231193176,10.1016/j.jhin.2023.03.002,10.1177/10596011221150756,10.1080/08039488.2024.2322495,10.1007/s00787-024-02406-w,10.1142/s0219877024500275,10.1155/2023/2516746,10.1080/08039488.2023.2222698,10.3389/fpsyg.2023.1183704,10.1111/acer.15119,10.1080/20008066.2023.2191396,10.1007/s00787-022-02107-2,10.1007/s11218-022-09734-2,10.1016/j.rssm.2023.100876,10.3390/f15020354,10.1007/s11629-023-8914-3,10.14746/quageo-2023-0016,10.18146/view.297,10.18146/tmg.835,10.5117/9789463727815,10.1177/08912424231163485,10.1007/978-94-6265-515-7,10.1038/s41467-023-41057-4,10.1093/gigascience/giad047,10.1038/s41592-023-01886-z,10.1093/nar/gkad289,10.1101/2023.01.21.525030,10.1016/j.gpb.2022.09.011,10.1021/acs.jpcb.4c01987,10.1021/acs.jctc.3c00663,10.1021/acs.jpcb.3c04473,10.26434/chemrxiv-2023-w0h1p,10.1073/pnas.2305899120,10.1101/2023.05.01.538927,10.1101/2023.12.22.23300430,10.1002/agt2.386,10.1002/adfm.202214179,10.1109/milcom58377.2023.10356332,10.1101/2024.05.03.24306699,10.1101/2024.04.16.24305925,10.1101/2023.10.25.23297571,10.3389/fphys.2023.1202186,10.1103/physrevb.109.205301,10.1103/physrevb.108.195303,10.1523/eneuro.0197-23.2023,10.3390/v15091897,10.1016/j.prdoa.2024.100251,10.3390/ijms24108995,10.3390/ijms24032247,10.1016/j.isci.2023.108171,10.1158/2326-6066.cir-23-0496,10.1101/2023.12.07.570715,10.1016/j.cell.2023.11.008,10.1093/abt/tbad025,10.1016/j.celrep.2023.113280,10.1101/2023.06.18.545488,10.3390/cancers15102788,10.1101/2023.03.07.531525,10.1080/13543784.2023.2179482,10.1016/j.bbrc.2022.09.019,10.3389/fimmu.2022.996026,10.1111/liv.15927,10.1101/2023.11.17.23298672,10.1111/liv.15665,10.1016/j.cgh.2023.04.016,10.1016/j.jhepr.2022.100667,10.1007/s11914-023-00843-1,10.1007/s11914-023-00842-2,10.1007/s11914-023-00855-x,10.3390/rs15235545,10.1029/2022gl102689,10.3390/rs14236069,10.1038/s41467-024-46327-3,10.1002/cam4.6761,10.3389/fonc.2023.1100585,10.1109/vtc2023-fall60731.2023.10333522,10.1128/jvi.00100-23,10.1021/acs.jpcc.3c05477,10.1021/acsaem.3c01370,10.3389/fnins.2023.1217993,10.1016/j.visres.2023.108296,10.1016/j.jad.2023.07.014,10.1001/jamanetworkopen.2023.17905,10.1007/s00371-024-03454-8,10.1109/smc53992.2023.10394105,10.1007/s00521-023-09367-2,10.1145/3582700.3582707,10.1007/s10803-024-06302-9,10.1016/j.psychres.2024.115838,10.1016/j.rasd.2024.102339,10.1177/13623613231213543,10.1007/s10803-023-06039-x,10.1016/j.jplph.2023.154138,10.1016/j.freeradbiomed.2024.04.217,10.1016/j.freeradbiomed.2023.06.021,10.1093/jncimonographs/lgad014,10.1038/s41467-023-37269-3,10.1111/liv.15893,10.1101/2023.04.25.538102,10.1063/5.0142200,10.1016/b978-0-323-95124-1.00017-6,10.1101/2023.05.17.541187,10.1101/2023.05.17.541174,10.1007/s00415-024-12430-0,10.1093/ntr/ntae084,10.1093/schbul/sbae024,10.1038/s41386-024-01842-1,10.21203/rs.3.rs-3168186/v1,10.1101/2023.08.21.23294348,10.1038/s41380-023-02165-1,10.1136/bmjopen-2022-066249,10.1038/s41585-024-00869-9,10.1158/0008-5472.can-23-0555,10.1101/2022.11.02.514910,10.3390/s24072335,10.1109/sensors56945.2023.10324963,10.1038/s41528-023-00258-z,10.3390/bios12050322,10.1371/journal.pone.0288803,10.3389/fpubh.2023.1219676,10.1016/j.soard.2023.09.026,10.3389/fpsyg.2023.1106571,10.2196/46415,10.1101/2023.04.20.23288698,10.1111/joes.12620,10.1101/2024.04.22.24306094,10.1007/s00401-024-02721-1,10.1101/2024.02.28.582621,10.1016/j.neuron.2024.01.008,10.1002/alz.13576,10.1001/jamaneurol.2023.3599,10.1186/s40478-023-01626-6,10.1111/acel.13938,10.1101/2023.07.20.23292771,10.1101/2023.07.06.23292312,10.1101/2023.04.21.23288938,10.1186/s13024-022-00590-4,10.1186/s13058-024-01777-x,10.1117/1.jmi.10.5.054503,10.1002/mp.17040,10.1016/j.brat.2024.104494,10.1176/appi.ajp.20230272,10.1001/jamapsychiatry.2023.5138,10.1016/j.addbeh.2023.107911,10.1016/j.explore.2023.11.001,10.1038/s44220-023-00084-2,10.1007/s40429-023-00501-7,10.1016/j.drugalcdep.2023.109890,10.1145/3631461.3631550,10.1016/j.jcss.2023.02.004,10.1080/15384101.2021.2023304,10.3390/ijms241713272,10.1016/j.jval.2024.01.020,10.1038/s41366-023-01396-0,10.1021/acs.jpcc.3c04680,10.1021/acs.jpcc.4c01814,10.4025/actascilangcult.v45i2.67723,10.1007/s10915-023-02353-9,10.1007/s42967-023-00287-5,10.1007/s10543-023-00954-2,10.1128/jvi.00398-22,10.1093/genetics/iyad216,10.1101/2023.10.17.562696
9852805,0.664279,0.71603,0.804951,0.66443,0.792039,0.706248,0.662371,0.636286,0.653481,0.656585,0.689969,0.631099,0.67478,0.675269,0.697217,0.652161,0.59892,0.620646,0.719614,0.673319,0.79326,0.598898,0.650244,0.598898,0.656585,0.742095,0.679409,0.656585,0.709277,0.706248,0.656585,0.713827,0.713827,0.804158,0.695196,0.668766,0.792039,0.708587,0.647683,0.640871,0.797793,0.722118,0.792039,0.780526,0.666128,0.792039,0.799811,0.666128,0.708587,0.792039,0.696604,0.6617,0.619911,0.71245,0.658831,0.706248,0.700098,0.659524,0.780526,0.650244,0.671416,0.73565,0.656585,0.686618,0.660737,0.807062,0.666554,0.701813,0.671416,0.758636,0.79901,0.697638,0.631099,0.689969,0.649179,0.705377,0.727629,0.713827,0.667681,0.669279,0.636217,0.723802,0.723802,0.697328,0.671416,0.677691,0.688542,0.710821,0.666128,0.656585,0.71603,0.693131,0.674421,0.721966,0.701813,0.681717,0.674421,0.656585,0.677691,0.705409,0.637456,0.806735,0.656585,0.673423,0.645369,0.650663,0.655838,0.659524,0.694022,0.706248,0.694022,0.689969,0.656585,0.795718,0.713827,0.729486,0.754409,0.681078,0.671416,0.699279,0.636689,0.650244,0.640871,0.666843,0.640871,0.645369,0.649179,0.656585,0.706248,0.627468,0.670939,0.630881,0.67711,0.692766,0.677781,0.67085,0.667681,0.657105,0.615686,0.697532,0.695196,0.706248,0.705409,0.701669,0.679409,0.806399,0.726088,0.807689,0.631099,0.656585,0.676648,0.714368,0.713827,0.804316,0.656585,0.707682,0.807062,0.806053,0.695196,0.674421,0.695613,0.754409,0.719382,0.74956,0.593965,0.656585,0.687657,0.678959,0.706248,0.651041,0.688542,0.621793,0.593061,0.626768,0.658604,0.676299,0.653762,0.645849,0.6617,0.646348,0.656585,0.688204,0.638822,0.637456,0.6617,0.706662,0.689969,0.658604,0.647683,0.74956,0.707682,0.687657,0.67085,0.731143,0.730553,0.650244,0.636828,0.695613,0.77424,0.65143,0.663245,0.695196,0.770147,0.695871,0.69459,0.634327,0.666649,0.656585,0.663707,0.626768,0.667681,0.656585,0.712934,0.677781,0.668766,0.667681,0.707682,0.681717,0.656585,0.662922,0.691361,0.659397,0.711157,0.645369,0.590056,0.590056,0.697328,0.71603,0.662371,0.623636,0.709277,0.606403,0.697217,0.667681,0.66443,0.737269,0.705409,0.748002,0.687657,0.684203,0.705377,0.697328,0.743923,0.805329,0.667681,0.713058,0.671416,0.786491,0.80057,0.701813,0.785886,0.791499,0.656585,0.788685,0.792039,0.66443,0.647683,0.666128,0.742095,0.674421,0.62823,0.656585,0.666554,0.693698,0.71603,0.687657,0.713827,0.714368,0.714368,0.679824,0.656585,0.677691,0.699279,0.693279,0.674421,0.666128,0.783958,0.678959,0.671416,0.656585,0.697158,0.717191,0.799811,0.622055,0.751416,0.666128,0.666128,0.660031,0.66443,0.715836,0.67323,0.676299,0.694975,0.668609,0.689969,0.658978,0.658331,0.695613,0.652155,0.613933,0.626768,0.633574,0.805329,0.687657,0.64325,0.656585,0.694022,0.637456,0.67085,0.681325,0.626768,0.677691,0.723802,0.677781,0.640871,0.676648,0.804861,0.679409,0.808041,0.803313,0.63267,0.63267,0.645076,0.648277,0.689969,0.699262,0.679824,0.644776,0.649179,0.672576,0.633529,0.633529,0.684931,0.653481,0.727629,0.666128,0.67478,0.649321,0.758502,0.685847,0.742095,0.663245,0.69168,0.69168,0.687657,0.766078,0.720369,0.667681,0.643848,0.683691,0.646348,0.68337,0.695196,0.639072,0.619911,0.625345,0.658604,0.748227,0.71806,0.645002,0.686305,0.636828,0.552302,0.727629,0.651041,0.7036,0.613933,0.630733,0.623003,0.616902,0.627468,0.616902,0.671416,0.7036,0.678959,0.688204,0.653138,0.735086,0.656585,0.667681,0.643709,0.649179,0.656585,0.73565,0.667681,0.661287,0.661287,0.645431,0.805696,0.787454,0.787104,0.666128,0.652161,0.66443,0.780526,0.805329,0.668766,0.652161,0.656585,0.676648,0.638389,0.640871,0.689969,0.656585,0.632648,0.656585,0.647425,0.758636,0.662371,0.68337,0.7036,0.669153,0.688771,0.676648,0.67085,0.635712,0.635478,0.776435,0.673423,0.606403,0.656585,0.656585,0.656585,0.701813,0.684471,0.688542,0.688204,0.656585,0.688204,0.688542,0.67478,0.668609,0.631454,0.706248,0.719382,0.651041,0.656585,0.627468,0.6617,0.640871,0.656585,0.676648,0.6617,0.715836,0.694022,0.709277,0.700723,0.688204,0.694022,0.66443,0.545972,0.672576,0.685847,0.656585,0.669279,0.768064,0.54038,0.694022,0.713827,0.782668,0.701813,0.658604,0.734132,0.652161,0.685599,0.6617,0.759769,0.703889,0.679409,0.653481,0.666649,0.694022,0.681221,0.665449,0.630733,0.660079,0.661903,0.621793,0.651302,0.681717,0.808283,0.708892,0.661169,0.653424,0.647944,0.677691,0.61651,0.66443,0.650226,0.64045,0.726088,0.779561,0.678795,0.708587,0.714368,0.631099,0.646364,0.677691,0.697328,0.697217,0.652155,0.660737,0.804951,0.697328,0.647683,0.647683,0.796123,0.804158,0.805696,0.790472,0.77504,0.8046,0.780876,0.806053,0.805329,0.803313,0.800557,0.804951,0.803743,0.803313,0.805329,0.804158,0.804561,0.804034,0.804158,0.804561,0.804951,0.800557,0.798455,0.804158,0.805859,0.802468,0.804951,0.804158,0.804561,0.806053,0.803743,0.803313,0.805696,0.805696,0.806082,0.800555,0.801894,0.803743,0.804951,0.798522,0.80287,0.803743,0.79313,0.803743,0.805696,0.799938,0.803313,0.807689,0.806399,0.804561,0.803313,0.803313,0.806399,0.79321,0.798338,0.800989,0.806053,0.806519,0.802402,0.804034,0.796202,0.80197,0.806053,0.803743,0.802897,0.797319,0.805329,0.803635,0.799249,0.794657,0.805696,0.806053,0.805859,0.806519,0.798998,0.805783,0.806703,0.804004,0.803279,0.804951,0.799901,0.803313,0.80287,0.803743,0.805188,0.803105,0.795284,0.79095,0.792681,0.798338,0.802253,0.803635,0.804951,0.803205,0.804951,0.804951,0.802814,0.805329,0.806053,0.804951,0.805859,0.802878,0.804158,0.799502,0.804561,0.804158,0.804158,0.806735,0.805696,0.805329,0.785312,0.802774,0.805696,0.804936,0.803313,0.801936,0.803743,0.800922,0.807445,0.804204,0.805329,0.803635,0.802411,0.792228,0.802092,0.803635,0.80367,0.806399,0.807062
13062422,0.656467,0.673057,0.815195,0.584465,0.783319,0.657182,0.580665,0.530483,0.563997,0.569866,0.629842,0.520015,0.603238,0.604111,0.642161,0.561485,0.450684,0.498369,0.678771,0.60062,0.784908,0.534678,0.55782,0.534678,0.569866,0.713424,0.611462,0.569866,0.662141,0.657182,0.569866,0.669517,0.669517,0.814673,0.638749,0.592395,0.783319,0.661015,0.552892,0.539593,0.790754,0.682734,0.783319,0.768058,0.587582,0.783319,0.79333,0.587582,0.661015,0.783319,0.641128,0.579422,0.496817,0.667294,0.574079,0.657182,0.646991,0.575372,0.768058,0.55782,0.597195,0.703697,0.569866,0.624065,0.577633,0.816582,0.588362,0.64985,0.597195,0.737638,0.79231,0.642869,0.520015,0.629842,0.555775,0.655749,0.691361,0.669517,0.590419,0.593327,0.530344,0.685383,0.685383,0.642346,0.597195,0.608422,0.627388,0.664654,0.587582,0.569866,0.673057,0.635245,0.602595,0.682493,0.64985,0.615524,0.602595,0.569866,0.608422,0.655801,0.53282,0.816367,0.569866,0.600807,0.548405,0.558623,0.568458,0.575372,0.636759,0.657182,0.636759,0.629842,0.569866,0.785458,0.669517,0.69424,0.731552,0.614402,0.597195,0.645621,0.53129,0.55782,0.539593,0.58889,0.539593,0.548405,0.555775,0.569866,0.657182,0.512583,0.596334,0.519571,0.607391,0.634623,0.608582,0.596172,0.590419,0.621138,0.569866,0.64269,0.638749,0.657182,0.655801,0.649609,0.611462,0.816147,0.688961,0.816992,0.520015,0.569866,0.606569,0.670388,0.669517,0.799023,0.569866,0.659535,0.816582,0.81592,0.638749,0.602595,0.639454,0.731552,0.678403,0.724484,0.439221,0.569866,0.625862,0.610666,0.657182,0.559347,0.627388,0.500782,0.437104,0.511138,0.573654,0.605949,0.56453,0.549338,0.579422,0.550306,0.569866,0.626806,0.535538,0.53282,0.579422,0.628346,0.629842,0.573654,0.552892,0.724484,0.659535,0.625862,0.596172,0.696797,0.695889,0.55782,0.531566,0.639454,0.77795,0.56009,0.582281,0.638749,0.770828,0.63989,0.637723,0.526551,0.588535,0.569866,0.583132,0.511138,0.590419,0.569866,0.668076,0.608582,0.592395,0.590419,0.659535,0.615524,0.569866,0.606569,0.632226,0.600874,0.685383,0.548405,0.430002,0.430002,0.642346,0.673057,0.580665,0.50464,0.662141,0.467557,0.642161,0.590419,0.584465,0.706156,0.655801,0.722193,0.625862,0.61987,0.655749,0.642346,0.716152,0.815444,0.590419,0.668277,0.597195,0.797789,0.794295,0.64985,0.81592,0.782615,0.569866,0.778926,0.783319,0.584465,0.552892,0.587582,0.713424,0.602595,0.514149,0.569866,0.588362,0.636209,0.673057,0.625862,0.669517,0.670388,0.670388,0.612194,0.569866,0.608422,0.645621,0.635496,0.602595,0.587582,0.815195,0.610666,0.597195,0.569866,0.642061,0.674915,0.79333,0.582281,0.771535,0.587582,0.587582,0.576318,0.584465,0.672746,0.600461,0.605949,0.638374,0.59211,0.629842,0.574354,0.573142,0.639454,0.561474,0.484048,0.511138,0.525032,0.815444,0.625862,0.544268,0.569866,0.636759,0.53282,0.596172,0.614836,0.511138,0.608422,0.685383,0.608582,0.539593,0.606569,0.799707,0.611462,0.803668,0.814116,0.523205,0.523205,0.547835,0.554038,0.629842,0.645593,0.612194,0.547249,0.555775,0.599286,0.524941,0.524941,0.621138,0.563997,0.691361,0.587582,0.603238,0.633641,0.73677,0.622729,0.713424,0.582281,0.632771,0.632771,0.625862,0.748186,0.679969,0.590419,0.545438,0.618977,0.550306,0.618417,0.638749,0.536034,0.496817,0.508195,0.573654,0.740868,0.676301,0.547691,0.623523,0.531566,0.552394,0.691361,0.559347,0.652814,0.484048,0.519271,0.503317,0.490423,0.512583,0.490423,0.597195,0.652814,0.610666,0.626806,0.563346,0.702838,0.569866,0.590419,0.545168,0.555775,0.569866,0.703697,0.590419,0.578655,0.578655,0.548526,0.815686,0.794449,0.77684,0.587582,0.561485,0.584465,0.768058,0.815444,0.592395,0.561485,0.569866,0.606569,0.534678,0.539593,0.629842,0.569866,0.52316,0.569866,0.552394,0.737638,0.580665,0.618417,0.652814,0.593098,0.627783,0.606569,0.596172,0.585641,0.528865,0.780084,0.600807,0.467557,0.569866,0.569866,0.569866,0.64985,0.620338,0.627388,0.626806,0.569866,0.626806,0.627388,0.603238,0.59211,0.520738,0.657182,0.678403,0.559347,0.569866,0.512583,0.579422,0.539593,0.569866,0.606569,0.579422,0.672746,0.636759,0.662141,0.648034,0.626806,0.636759,0.584465,0.60062,0.599286,0.622729,0.569866,0.593327,0.795979,0.592395,0.636759,0.669517,0.770937,0.64985,0.573654,0.701383,0.561485,0.622299,0.579422,0.739258,0.653292,0.611462,0.563997,0.588535,0.636759,0.614654,0.586338,0.519271,0.576409,0.579798,0.500782,0.559846,0.615524,0.81738,0.661513,0.578435,0.56389,0.553396,0.608422,0.516837,0.584465,0.557786,0.538762,0.688961,0.766755,0.610378,0.661015,0.670388,0.520015,0.550337,0.608422,0.642346,0.642161,0.561474,0.577633,0.815195,0.642346,0.552892,0.552892,0.816367,0.814673,0.815686,0.798123,0.816147,0.816992,0.816992,0.81592,0.81316,0.814116,0.815444,0.815195,0.814399,0.814116,0.815444,0.814673,0.814939,0.815195,0.814673,0.814939,0.815195,0.815444,0.812145,0.814673,0.816367,0.809409,0.81288,0.814673,0.814939,0.81592,0.814399,0.814116,0.815686,0.815686,0.816992,0.814399,0.812739,0.814399,0.815195,0.815444,0.813822,0.814399,0.799147,0.814399,0.815686,0.811983,0.814116,0.816992,0.816147,0.814939,0.814116,0.814116,0.816147,0.81592,0.815444,0.815686,0.81592,0.81679,0.814673,0.815195,0.815444,0.814399,0.81592,0.814399,0.81259,0.814939,0.815444,0.814939,0.81592,0.815686,0.815686,0.81592,0.816367,0.81679,0.804767,0.817189,0.815343,0.815686,0.815686,0.815195,0.809752,0.814116,0.813822,0.814399,0.816367,0.813562,0.815444,0.816147,0.815686,0.815444,0.815444,0.814939,0.815195,0.816582,0.815195,0.815195,0.810416,0.815444,0.81592,0.815195,0.804773,0.815444,0.814673,0.815444,0.814939,0.814673,0.814673,0.816367,0.815686,0.815444,0.802329,0.81592,0.815686,0.817189,0.814116,0.813204,0.814399,0.814673,0.81738,0.818097,0.815444,0.814939,0.813519,0.814673,0.814939,0.814939,0.81592,0.816147,0.816582
13528070,0.784275,0.786828,0.812049,0.774861,0.14878,0.784382,0.774425,0.76912,0.772573,0.773215,0.780511,0.76811,0.777095,0.777202,0.782205,0.772302,0.762127,0.766114,0.78775,0.776775,0.811406,0.769534,0.771911,0.769534,0.773215,0.793894,0.778118,0.773215,0.785129,0.784382,0.773215,0.786268,0.786268,0.811464,0.781728,0.775788,0.810901,0.784958,0.771391,0.770025,0.81333,0.788403,0.810901,0.806409,0.775223,0.810901,0.814215,0.775223,0.784958,0.810901,0.78206,0.774284,0.765976,0.785921,0.773682,0.784382,0.782891,0.773827,0.806409,0.771911,0.776361,0.792063,0.773215,0.779742,0.774081,0.813608,0.775314,0.783303,0.776361,0.798903,0.813862,0.782305,0.76811,0.780511,0.771694,0.784168,0.789865,0.786268,0.775555,0.775899,0.769107,0.788846,0.788846,0.782232,0.776361,0.777736,0.780182,0.785513,0.775223,0.773215,0.786828,0.781245,0.777016,0.788363,0.783303,0.778633,0.777016,0.773215,0.777736,0.784176,0.76935,0.813366,0.773215,0.776798,0.770924,0.771996,0.77306,0.773827,0.781453,0.784382,0.781453,0.780511,0.773215,0.807718,0.786268,0.790366,0.797576,0.77849,0.776361,0.782696,0.7692,0.771911,0.770025,0.775376,0.770025,0.770924,0.771694,0.773215,0.784382,0.767411,0.776257,0.768068,0.777608,0.781159,0.777756,0.776238,0.775555,0.779358,0.773215,0.78228,0.781728,0.784382,0.784176,0.783269,0.778118,0.813118,0.789452,0.814071,0.76811,0.773215,0.777506,0.786405,0.786268,0.816261,0.773215,0.784734,0.813608,0.803655,0.781728,0.777016,0.781826,0.797576,0.78769,0.796095,0.761246,0.773215,0.779979,0.778017,0.784382,0.772073,0.780182,0.76633,0.761086,0.767276,0.773635,0.777429,0.772631,0.771021,0.774284,0.771121,0.773215,0.780105,0.76962,0.76935,0.774284,0.784483,0.780511,0.773635,0.771391,0.796095,0.784734,0.779979,0.776238,0.790817,0.790656,0.771911,0.769227,0.781826,0.796658,0.772153,0.77461,0.781728,0.795804,0.781887,0.781586,0.768737,0.775334,0.773215,0.774708,0.767276,0.775555,0.773215,0.786043,0.777756,0.775788,0.775555,0.784734,0.778633,0.773215,0.777506,0.780833,0.776806,0.788846,0.770924,0.760558,0.760558,0.782232,0.786828,0.774425,0.76668,0.785129,0.763477,0.782205,0.775555,0.774861,0.792517,0.784176,0.795628,0.779979,0.779193,0.784168,0.782232,0.794425,0.812328,0.775555,0.786074,0.776361,0.791113,0.814553,0.783303,0.812862,0.81068,0.773215,0.809546,0.810901,0.774861,0.771391,0.775223,0.793894,0.777016,0.767557,0.773215,0.775314,0.781377,0.786828,0.779979,0.786268,0.786405,0.786405,0.77821,0.773215,0.777736,0.782696,0.781279,0.777016,0.775223,0.812049,0.778017,0.776361,0.773215,0.782191,0.787125,0.814215,0.77461,0.796155,0.775223,0.775223,0.773933,0.774861,0.786779,0.776756,0.777429,0.781676,0.775755,0.780511,0.773713,0.773578,0.781826,0.772301,0.76486,0.767276,0.76859,0.812328,0.779979,0.770499,0.773215,0.781453,0.76935,0.776238,0.778545,0.767276,0.777736,0.788846,0.777756,0.770025,0.777506,0.816516,0.778118,0.818033,0.810841,0.768415,0.768415,0.770865,0.771511,0.780511,0.782692,0.77821,0.770805,0.771694,0.776613,0.768582,0.768582,0.779358,0.772573,0.789865,0.775223,0.777095,0.781025,0.791989,0.779566,0.793894,0.77461,0.780907,0.780907,0.779979,0.801327,0.787946,0.775555,0.770619,0.779078,0.771121,0.779005,0.781728,0.769669,0.765976,0.767005,0.773635,0.788133,0.787348,0.77085,0.779671,0.769227,0.771339,0.789865,0.772073,0.783736,0.76486,0.768039,0.766559,0.765412,0.767411,0.765412,0.776361,0.783736,0.778017,0.780105,0.772503,0.791905,0.773215,0.775555,0.770591,0.771694,0.773215,0.792063,0.775555,0.774197,0.774197,0.770937,0.812599,0.802574,0.808921,0.775223,0.772302,0.774861,0.806409,0.812328,0.775788,0.772302,0.773215,0.777506,0.769534,0.770025,0.780511,0.773215,0.76841,0.773215,0.771339,0.798903,0.774425,0.779005,0.783736,0.775871,0.780235,0.777506,0.776238,0.774997,0.768962,0.797865,0.776798,0.763477,0.773215,0.773215,0.773215,0.783303,0.779254,0.780182,0.780105,0.773215,0.780105,0.780182,0.777095,0.775755,0.768179,0.784382,0.78769,0.772073,0.773215,0.767411,0.774284,0.770025,0.773215,0.777506,0.774284,0.786779,0.781453,0.785129,0.715214,0.780105,0.781453,0.774861,0.776775,0.776613,0.779566,0.773215,0.775899,0.803655,0.775788,0.781453,0.786268,0.807212,0.783303,0.773635,0.79164,0.772302,0.77951,0.774284,0.799264,0.783806,0.778118,0.772573,0.775334,0.781453,0.778522,0.775078,0.768039,0.773943,0.774327,0.76633,0.772127,0.778633,0.81451,0.785033,0.774172,0.772562,0.771444,0.777736,0.767809,0.774861,0.771907,0.769942,0.789452,0.806052,0.777981,0.784958,0.786405,0.76811,0.771124,0.777736,0.782232,0.782205,0.772301,0.774081,0.812049,0.782232,0.771391,0.771391,0.813366,0.811464,0.812599,0.804052,0.813118,0.814071,0.814071,0.812862,0.812328,0.810841,0.812328,0.812049,0.811158,0.810841,0.812328,0.811464,0.811761,0.812049,0.80868,0.811761,0.812049,0.812328,0.810137,0.811464,0.813366,0.810751,0.812049,0.811464,0.811761,0.812862,0.811158,0.810841,0.812599,0.812599,0.81288,0.811158,0.810752,0.811158,0.812049,0.808817,0.810514,0.811158,0.805325,0.811158,0.812599,0.811158,0.810841,0.814071,0.813118,0.811761,0.810841,0.810841,0.813118,0.812862,0.812328,0.812599,0.812862,0.813842,0.811464,0.812049,0.812328,0.811158,0.81047,0.811158,0.811761,0.809018,0.812328,0.809018,0.812862,0.812599,0.812599,0.80436,0.813366,0.811385,0.809001,0.80927,0.81451,0.803972,0.812599,0.812049,0.808937,0.810841,0.810514,0.808331,0.813366,0.811607,0.812328,0.813118,0.812599,0.812328,0.812328,0.811761,0.812049,0.813608,0.812049,0.812049,0.810752,0.812328,0.812862,0.812049,0.813366,0.812328,0.80868,0.812328,0.811761,0.811464,0.811464,0.813366,0.812599,0.812328,0.807228,0.812862,0.812599,0.811054,0.810841,0.809826,0.811158,0.811464,0.81451,0.815323,0.809663,0.811761,0.810176,0.811464,0.811761,0.811761,0.812862,0.813118,0.813608
13057717,0.681978,0.695144,0.808342,0.626886,0.787643,0.366995,0.317879,0.338229,0.611826,0.616117,0.661221,0.580378,0.640933,0.641591,0.670768,0.374577,0.533481,0.565373,0.699721,0.638961,0.789048,0.590721,0.607333,0.590721,0.616117,0.727957,0.647157,0.616117,0.68646,0.682542,0.616117,0.69232,0.69232,0.807622,0.668114,0.632793,0.787643,0.68557,0.603767,0.59422,0.794238,0.702909,0.787643,0.774268,0.629203,0.787643,0.796535,0.629203,0.68557,0.787643,0.669964,0.623151,0.564309,0.69055,0.619211,0.682542,0.674538,0.620163,0.774268,0.607333,0.636387,0.719947,0.616117,0.656778,0.62183,0.810252,0.629784,0.676776,0.636387,0.748197,0.795624,0.67132,0.580378,0.661221,0.605851,0.681412,0.709884,0.69232,0.631317,0.633489,0.58765,0.705045,0.705045,0.670913,0.636387,0.644851,0.659331,0.688453,0.629203,0.616117,0.695144,0.665396,0.640448,0.702715,0.676776,0.650247,0.640448,0.616117,0.644851,0.681453,0.589403,0.809957,0.616117,0.639101,0.600533,0.607916,0.615086,0.620163,0.66657,0.682542,0.66657,0.661221,0.616117,0.797291,0.69232,0.712223,0.743069,0.649392,0.636387,0.673467,0.588319,0.607333,0.59422,0.630177,0.59422,0.600533,0.605851,0.616117,0.682542,0.57519,0.635741,0.580067,0.64407,0.664915,0.644972,0.63562,0.631317,0.654534,0.616117,0.67118,0.668114,0.682542,0.681453,0.676588,0.647157,0.809653,0.707939,0.810818,0.580378,0.616117,0.643448,0.693014,0.69232,0.801637,0.616117,0.684399,0.810252,0.80934,0.668114,0.640448,0.668662,0.743069,0.699426,0.737148,0.526067,0.616117,0.658158,0.646553,0.682542,0.608441,0.659331,0.56703,0.524709,0.574186,0.618898,0.64298,0.612215,0.601205,0.623151,0.601902,0.616117,0.658883,0.591333,0.589403,0.623151,0.683078,0.661221,0.618898,0.603767,0.737148,0.684399,0.658158,0.63562,0.714305,0.713565,0.607333,0.588515,0.668662,0.774235,0.608982,0.625266,0.668114,0.76885,0.669001,0.667318,0.584971,0.629912,0.616117,0.625897,0.574186,0.631317,0.616117,0.691172,0.644972,0.632793,0.631317,0.684399,0.650247,0.616117,0.643448,0.663061,0.639152,0.705045,0.600533,0.520179,0.520179,0.670913,0.695144,0.62407,0.569687,0.68646,0.544577,0.670768,0.631317,0.626886,0.721966,0.681453,0.735237,0.658158,0.653564,0.681412,0.670913,0.730216,0.808685,0.631317,0.691332,0.636387,0.809653,0.797397,0.676776,0.80934,0.787021,0.616117,0.783771,0.787643,0.626886,0.603767,0.629203,0.727957,0.640448,0.57628,0.616117,0.629784,0.666143,0.695144,0.658158,0.69232,0.693014,0.693014,0.647713,0.616117,0.644851,0.673467,0.665591,0.640448,0.629203,0.808342,0.646553,0.636387,0.616117,0.670691,0.69663,0.796535,0.625266,0.769571,0.629203,0.629203,0.62086,0.626886,0.694896,0.638841,0.64298,0.667823,0.63258,0.661221,0.619413,0.618522,0.668662,0.609988,0.555623,0.574186,0.583901,0.808685,0.658158,0.597563,0.616117,0.66657,0.589403,0.63562,0.649722,0.574186,0.644851,0.705045,0.644972,0.59422,0.643448,0.802251,0.647157,0.805825,0.806855,0.582616,0.582616,0.600123,0.604595,0.661221,0.673445,0.647713,0.599702,0.605851,0.637957,0.583837,0.583837,0.654534,0.611826,0.709884,0.629203,0.640933,0.664155,0.754831,0.655753,0.727957,0.625266,0.663483,0.663483,0.658158,0.757153,0.700684,0.631317,0.598402,0.652882,0.601902,0.652454,0.668114,0.591685,0.564309,0.572145,0.618898,0.74295,0.69774,0.60002,0.656362,0.588515,0.603407,0.709884,0.608441,0.679103,0.555623,0.579857,0.568774,0.559945,0.57519,0.559945,0.636387,0.679103,0.646553,0.658883,0.611351,0.719243,0.616117,0.631317,0.598208,0.605851,0.616117,0.719947,0.631317,0.622584,0.622584,0.60062,0.809017,0.789145,0.781939,0.629203,0.609996,0.626886,0.774268,0.808685,0.632793,0.609996,0.616117,0.643448,0.590721,0.59422,0.661221,0.616117,0.582585,0.616117,0.603407,0.748197,0.62407,0.652454,0.679103,0.633318,0.659635,0.643448,0.63562,0.627759,0.586604,0.776493,0.639101,0.544577,0.616117,0.616117,0.616117,0.676776,0.653922,0.659331,0.658883,0.616117,0.658883,0.659331,0.640933,0.63258,0.580885,0.682542,0.699426,0.608441,0.616117,0.57519,0.623151,0.59422,0.616117,0.643448,0.623151,0.694896,0.66657,0.68646,0.675354,0.658883,0.66657,0.626886,0.638961,0.637957,0.655753,0.616117,0.633489,0.790875,0.632793,0.66657,0.69232,0.776775,0.676776,0.618898,0.718052,0.609996,0.655423,0.623151,0.749567,0.679479,0.647157,0.611826,0.629912,0.66657,0.649584,0.628277,0.579857,0.620927,0.623428,0.56703,0.608804,0.650247,0.811354,0.685963,0.622422,0.611748,0.604131,0.644851,0.578155,0.626886,0.607308,0.593627,0.707939,0.773136,0.646334,0.68557,0.693014,0.580378,0.601924,0.644851,0.670913,0.670768,0.609988,0.62183,0.808342,0.670913,0.603767,0.603767,0.809957,0.805513,0.809017,0.792504,0.809653,0.810818,0.80884,0.80934,0.806521,0.802352,0.808685,0.808342,0.807245,0.806855,0.804486,0.807622,0.807988,0.808342,0.807622,0.807988,0.808342,0.808685,0.80525,0.807622,0.809957,0.805406,0.808342,0.807622,0.807988,0.807232,0.807245,0.806855,0.807018,0.809017,0.80884,0.807245,0.803978,0.807245,0.808342,0.808685,0.806451,0.807245,0.795521,0.807245,0.809017,0.807245,0.806855,0.810818,0.809653,0.805764,0.806855,0.806855,0.809653,0.807232,0.806659,0.807018,0.80934,0.796845,0.807622,0.806289,0.808685,0.807245,0.805254,0.807245,0.807988,0.807988,0.808685,0.807988,0.80934,0.809017,0.809017,0.807232,0.809957,0.810539,0.801383,0.81109,0.811354,0.809017,0.809017,0.808342,0.803015,0.806855,0.806451,0.807245,0.809957,0.807126,0.808685,0.809653,0.806882,0.808685,0.808685,0.805764,0.808342,0.79606,0.808342,0.808342,0.803836,0.808685,0.80934,0.808342,0.809957,0.806659,0.807622,0.806659,0.807988,0.807622,0.807622,0.809957,0.806882,0.808685,0.797363,0.80934,0.809017,0.809257,0.806855,0.805601,0.807245,0.807622,0.811354,0.798714,0.808685,0.807988,0.806034,0.807622,0.807988,0.807988,0.80934,0.795454,0.791533
13308163,0.67441,0.688564,0.81126,0.614551,0.786323,0.675017,0.611464,0.57138,0.046892,0.564946,0.087425,0.5263,0.592329,0.318476,0.662313,0.595989,0.510517,0.546436,0.693471,0.627759,0.787784,0.574679,0.593054,0.574679,0.602728,0.723585,0.636696,0.602728,0.679235,0.675017,0.602728,0.685533,0.685533,0.810644,0.659444,0.621019,0.786323,0.678277,0.589118,0.578558,0.793173,0.696884,0.786323,0.772378,0.61709,0.786323,0.795555,0.61709,0.678277,0.786323,0.661444,0.610455,0.545246,0.683631,0.606129,0.675017,0.666386,0.607175,0.772378,0.593054,0.624949,0.71507,0.602728,0.647157,0.609005,0.8129,0.617726,0.668802,0.624949,0.745003,0.794611,0.66291,0.563186,0.651978,0.591419,0.673801,0.704341,0.685533,0.619404,0.621781,0.571271,0.69917,0.69917,0.66247,0.624949,0.634185,0.649928,0.681378,0.61709,0.602728,0.688564,0.656502,0.629383,0.696676,0.668802,0.640059,0.629383,0.602728,0.634185,0.673845,0.573217,0.793482,0.602728,0.627913,0.585545,0.593696,0.601594,0.607175,0.657772,0.675017,0.657772,0.651978,0.564946,0.799192,0.685533,0.706837,0.73959,0.63913,0.624949,0.149836,0.572014,0.593054,0.578558,0.618157,0.578558,0.585545,0.591419,0.602728,0.675017,0.557405,0.624242,0.56284,0.633333,0.655981,0.634316,0.62411,0.619404,0.644721,0.602728,0.662759,0.659444,0.675017,0.673845,0.668599,0.636696,0.812385,0.702263,0.813386,0.563186,0.602728,0.632656,0.686278,0.685533,0.800837,0.602728,0.677017,0.8129,0.812116,0.659444,0.629383,0.660036,0.73959,0.693155,0.733328,0.502099,0.602728,0.648655,0.636038,0.675017,0.594276,0.649928,0.54829,0.500554,0.556285,0.605785,0.632144,0.598434,0.586287,0.610455,0.587057,0.602728,0.649443,0.575358,0.573217,0.610455,0.675595,0.651978,0.605785,0.589118,0.733328,0.677017,0.648655,0.62411,0.709059,0.70827,0.593054,0.572231,0.660036,0.776227,0.594871,0.612776,0.659444,0.770155,0.660403,0.658582,0.568295,0.617866,0.602728,0.613467,0.556285,0.619404,0.602728,0.6843,0.634316,0.621019,0.619404,0.677017,0.640059,0.602728,0.632656,0.653972,0.627968,0.69917,0.585545,0.495394,0.495394,0.66247,0.688564,0.611464,0.551261,0.679235,0.523066,0.662313,0.619404,0.614551,0.717218,0.673845,0.731305,0.648655,0.643666,0.673801,0.66247,0.725983,0.811554,0.619404,0.684472,0.624949,0.812385,0.796449,0.668802,0.812116,0.785677,0.602728,0.782294,0.786323,0.614551,0.589118,0.61709,0.723585,0.629383,0.558621,0.602728,0.617726,0.657311,0.688564,0.648655,0.685533,0.686278,0.686278,0.637302,0.602728,0.634185,0.66523,0.656713,0.629383,0.61709,0.81126,0.636038,0.624949,0.602728,0.66223,0.690158,0.795555,0.612776,0.770855,0.61709,0.61709,0.60794,0.614551,0.688298,0.627629,0.632144,0.659129,0.620786,0.651978,0.606351,0.605372,0.660036,0.59598,0.535503,0.556285,0.567106,0.791378,0.648655,0.58226,0.602728,0.657772,0.573217,0.62411,0.639489,0.556285,0.634185,0.69917,0.634316,0.578558,0.632656,0.801473,0.636696,0.805165,0.809988,0.565677,0.565677,0.585092,0.590032,0.651978,0.665206,0.637302,0.584626,0.591419,0.626664,0.567034,0.567034,0.644721,0.598005,0.704341,0.61709,0.629912,0.655157,0.755251,0.646044,0.723585,0.612776,0.654429,0.654429,0.648655,0.754435,0.694502,0.619404,0.583188,0.642925,0.587057,0.64246,0.659444,0.575749,0.545246,0.554007,0.605785,0.743004,0.691348,0.584977,0.646706,0.572231,0.58872,0.704341,0.594276,0.671312,0.535503,0.562605,0.550241,0.540355,0.557405,0.540355,0.624949,0.671312,0.636038,0.649443,0.597482,0.714321,0.602728,0.619404,0.582973,0.591419,0.602728,0.71507,0.619404,0.609833,0.609833,0.585641,0.811839,0.791607,0.780385,0.61709,0.595989,0.614551,0.772378,0.811554,0.621019,0.595989,0.602728,0.632656,0.574679,0.578558,0.651978,0.602728,0.565642,0.602728,0.58872,0.745003,0.611464,0.64246,0.671312,0.621593,0.650258,0.632656,0.62411,0.615508,0.570109,0.778385,0.627913,0.523066,0.602728,0.602728,0.602728,0.668802,0.644055,0.649928,0.649443,0.602728,0.649443,0.649928,0.629912,0.620786,0.56375,0.675017,0.693155,0.594276,0.602728,0.557405,0.610455,0.578558,0.602728,0.632656,0.610455,0.688298,0.657772,0.679235,0.667267,0.649443,0.657772,0.614551,0.627759,0.626664,0.646044,0.602728,0.621781,0.793215,0.621019,0.657772,0.685533,0.774997,0.668802,0.605785,0.713052,0.595989,0.645687,0.610455,0.746448,0.671717,0.636696,0.598005,0.617866,0.657772,0.639338,0.616076,0.562605,0.608014,0.61076,0.54829,0.594676,0.640059,0.781414,0.678701,0.609655,0.597919,0.589519,0.634185,0.56071,0.614551,0.593026,0.577902,0.218111,0.574057,0.6358,0.678277,0.686278,0.563186,0.587082,0.634185,0.66247,0.662313,0.59598,0.609005,0.81126,0.66247,0.589118,0.589118,0.812646,0.810644,0.809477,0.795059,0.812385,0.813386,0.813386,0.807579,0.806439,0.809988,0.811554,0.81126,0.809483,0.809988,0.811554,0.810644,0.810957,0.81126,0.810644,0.810957,0.804338,0.811554,0.807393,0.810644,0.811864,0.807262,0.810444,0.810644,0.810957,0.812116,0.810321,0.809988,0.811037,0.809477,0.813386,0.810321,0.808092,0.80522,0.81126,0.811554,0.808788,0.807785,0.798215,0.810321,0.80724,0.810321,0.809988,0.812623,0.808603,0.810957,0.809988,0.809988,0.812385,0.809785,0.810745,0.811839,0.812116,0.813146,0.810644,0.810444,0.811554,0.810321,0.812116,0.810321,0.810134,0.808493,0.811554,0.804613,0.812116,0.809477,0.809477,0.807579,0.808226,0.813146,0.800764,0.810037,0.813096,0.809477,0.811839,0.81126,0.80343,0.809988,0.809643,0.806943,0.811864,0.809063,0.809159,0.812385,0.811839,0.811554,0.811554,0.810957,0.81126,0.8129,0.81126,0.81126,0.806474,0.810745,0.811321,0.810444,0.812646,0.811554,0.810644,0.810745,0.810957,0.810644,0.808145,0.812646,0.808672,0.811554,0.795931,0.809447,0.811037,0.81362,0.809988,0.808916,0.810321,0.810644,0.813847,0.8147,0.806892,0.810957,0.809286,0.810644,0.810957,0.810957,0.812116,0.812385,0.8129


In [69]:
data_matrix = np.array(data_matrix)

gb_raw_shape = data_matrix.shape
print(gb_raw_shape)

gb_data = []
for i in range(gb_raw_shape[1]):
    gb_data.extend(data_matrix[:, i, :])
gb_data = np.array(gb_data)
print(gb_data.shape)

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

# get the projects for lowest predictions for each publication with distance matrix
for num_top in range(10, 0, -1):
    project_numbers_pred = []
    for i in range(len(train_pub_data), distance_matrix.shape[1]):
        project_numbers_pred.append(list(np.argsort(distance_matrix[:, i] + 1))[:num_top])

    project_lists = []
    for i in range(0, gb_data.shape[0], gb_raw_shape[0]):
        pub_belongs = gb_data[i:i + gb_raw_shape[0], 0] * project_numbers[i:i + gb_raw_shape[0]]
        project = sorted(list(pub_belongs[pub_belongs != 0].astype(int)), reverse=True)
        project_lists.append(project)

    project_lists_test = project_lists[len(train_pub_data):]

    # calculate accuracy
    # use y_test as mask for project_numbers_test
    accuracy_list = []
    for i, project_list in enumerate(list(project_lists_test)):
        ratio = len(set(project_numbers_pred[i]) & set(project_list)) / len(set(project_list))
        accuracy_list.append(ratio)

    accuracy = sum(accuracy_list) / len(accuracy_list)
    print(accuracy)

(225, 635, 2)
(142875, 2)
0.16279069767441862
0.14728682170542637
0.13178294573643412
0.11627906976744186
0.09302325581395349
0.07751937984496124
0.06201550387596899
0.05426356589147287
0.03875968992248062
0.023255813953488372
