In [1]:
import pandas as pd
import json
import LLDA.model.labeled_lda as llda
import numpy as np
from sklearn.metrics.pairwise import cosine_similarity
from scipy.spatial.distance import jensenshannon

In [2]:
with open('dim_sample.json') as f:
    all_data = json.load(f)

def get_unique_dis(data):
    disciplines = set()
    for pro_id in data.keys():
        disciplines.update(data[pro_id]['disciplines'])
    return disciplines

In [3]:
split = 180
train_data = {k: all_data[k] for k in list(all_data.keys())[:split]}
test_data = {k: all_data[k] for k in list(all_data.keys())[split:]}

train_project_data = {}
train_pub_data = []
for pro_id in train_data.keys():
    train_project_data[pro_id] = (train_data[pro_id]['title'], train_data[pro_id]['disciplines'])
    for pub_id in train_data[pro_id]['publications'].keys():
        train_pub_data.append((pub_id, train_data[pro_id]['publications'][pub_id]['title'], train_data[pro_id]['publications'][pub_id]['disciplines']))

test_project_data = {}
test_pub_data = []
for pro_id in test_data.keys():
    test_project_data[pro_id] = (test_data[pro_id]['title'], test_data[pro_id]['disciplines'])
    for pub_id in test_data[pro_id]['publications'].keys():
        test_pub_data.append((pub_id, test_data[pro_id]['publications'][pub_id]['title'], test_data[pro_id]['publications'][pub_id]['disciplines']))

print(len(train_project_data), len(train_pub_data))
print(len(test_project_data), len(test_pub_data))
print(len(get_unique_dis(train_data)), len(get_unique_dis({pub[0]: {'disciplines': pub[2]} for pub in train_pub_data})))

180 506
45 129
170 170


In [4]:
print(train_project_data[list(train_project_data.keys())[0]])
print(train_pub_data[0][1:])

('Quantifying trophic niches to measure the resilience of marine predators', ['4101', '4104', '3103'])
('Towards unlocking the trophic roles of rarely encountered squid: Opportunistic samples of Taningia danae and a Chiroteuthis aff. veranii reveal that the Southern Ocean top predators are nutrient links connecting deep-sea and shelf-slope environments', ['3103'])


In [5]:
# # load from disk
# llda_model_project = llda.LldaModel()
# llda_model_project.load_model_from_dir("LLDA/data_models/pro_abstracts_disciplines", load_derivative_properties=False)
# print("llda_model_project", llda_model_project)
# # print("Top-5 terms of topic 'virus': ", llda_model_project.top_terms_of_topic("virus", 5, False))
# print("Doc-Topic Matrix: \n", llda_model_project.theta)
# print("Topic-Term Matrix: \n", llda_model_project.beta)

In [6]:
llda_model_project = llda.LldaModel(labeled_documents=train_project_data.values())
print(llda_model_project)
llda_model_pub = llda.LldaModel(labeled_documents=[(pub[1], pub[2]) for pub in train_pub_data])
print(llda_model_pub)


Labeled-LDA Model:
	K = 171
	M = 180
	T = 1251
	WN = 2120
	LN = 281
	alpha = 0.29239766081871343
	eta = 0.001
	perplexity = 92.97554193238017
	

Labeled-LDA Model:
	K = 171
	M = 506
	T = 2987
	WN = 6374
	LN = 704
	alpha = 0.29239766081871343
	eta = 0.001
	perplexity = 200.9591573235818
	


In [7]:
# training
llda_model_project.training(iteration=10, log=True)
# while True:
#     print("iteration %s sampling..." % (llda_model.iteration + 1))
#     llda_model.training(1)
#     print("after iteration: %s, perplexity: %s" % (llda_model.iteration, llda_model.perplexity()))
#     print("delta beta: %s" % llda_model.delta_beta)
#     if llda_model.is_convergent(method="beta", delta=0.01):
#         break

after iteration: 0, perplexity: 92.97554193238017
gibbs sample count:  2120
after iteration: 1, perplexity: 37.85641536989131
gibbs sample count:  2120
after iteration: 2, perplexity: 35.307315196064025
gibbs sample count:  2120
after iteration: 3, perplexity: 34.293533709202784
gibbs sample count:  2120
after iteration: 4, perplexity: 33.22384783554604
gibbs sample count:  2120
after iteration: 5, perplexity: 33.15751964543431
gibbs sample count:  2120
after iteration: 6, perplexity: 33.09529453406034
gibbs sample count:  2120
after iteration: 7, perplexity: 33.20953333061363
gibbs sample count:  2120
after iteration: 8, perplexity: 32.20403454618368
gibbs sample count:  2120
after iteration: 9, perplexity: 32.11370576856241
gibbs sample count:  2120


In [8]:
llda_model_pub.training(iteration=10, log=True)

after iteration: 0, perplexity: 200.9591573235818
gibbs sample count:  6374
after iteration: 1, perplexity: 109.8484224831134
gibbs sample count:  6374
after iteration: 2, perplexity: 105.59155652386359
gibbs sample count:  6374
after iteration: 3, perplexity: 100.94317371357387
gibbs sample count:  6374
after iteration: 4, perplexity: 97.99581354987028
gibbs sample count:  6374
after iteration: 5, perplexity: 96.08697425550125
gibbs sample count:  6374
after iteration: 6, perplexity: 96.54776733223282
gibbs sample count:  6374
after iteration: 7, perplexity: 95.2943263298371
gibbs sample count:  6374
after iteration: 8, perplexity: 94.20039087912943
gibbs sample count:  6374
after iteration: 9, perplexity: 92.32390411357356
gibbs sample count:  6374


In [9]:
# # update
# print("before updating: ", llda_model)
# update_labeled_documents = [("new example test example test example test example test", ["example", "test"])]
# llda_model.update(labeled_documents=update_labeled_documents)
# print("after updating: ", llda_model)

# # train again
# # llda_model.training(iteration=10, log=True)
# while True:
#     print("iteration %s sampling..." % (llda_model.iteration + 1))
#     llda_model.training(1)
#     print("after iteration: %s, perplexity: %s" % (llda_model.iteration, llda_model.perplexity()))
#     print("delta beta: %s" % llda_model.delta_beta)
#     if llda_model.is_convergent(method="beta", delta=0.01):
#         break

In [10]:
# inference
# note: the result topics may be different for difference training, because gibbs sampling is a random algorithm
document = list(test_project_data.values())[0][0]
print(document)

topics = llda_model_project.inference(document=document, iteration=30, times=10)
# print sorted topics
sorted(topics, key=lambda x: x[0])

Center of Excellence in Complex Disease Genetics-from Discovery to Precision Medicine


[('3001', 0.005414771496642827),
 ('3002', 0.005414771496642827),
 ('3003', 0.005414771496642827),
 ('3004', 0.005414771496642827),
 ('3005', 0.005414771496642827),
 ('3006', 0.005414771496642827),
 ('3007', 0.005414771496642827),
 ('3008', 0.005414771496642827),
 ('3009', 0.005414771496642827),
 ('3101', 0.005414771496642827),
 ('3102', 0.005414771496642827),
 ('3103', 0.005414771496642827),
 ('3104', 0.005414771496642827),
 ('3105', 0.005414771496642827),
 ('3106', 0.005414771496642827),
 ('3107', 0.005414771496642827),
 ('3108', 0.005414771496642827),
 ('3109', 0.005414771496642827),
 ('3201', 0.005414771496642827),
 ('3202', 0.005414771496642827),
 ('3203', 0.005414771496642827),
 ('3204', 0.005414771496642827),
 ('3205', 0.005414771496642827),
 ('3206', 0.005414771496642827),
 ('3207', 0.005414771496642827),
 ('3208', 0.005414771496642827),
 ('3209', 0.005414771496642827),
 ('3210', 0.005414771496642827),
 ('3211', 0.005414771496642827),
 ('3212', 0.005414771496642827),
 ('3213', 

In [11]:
documents = list(test_project_data.values())
project_matrix_test = np.zeros((len(documents), llda_model_project.K))

for i, (document, _) in enumerate(documents):
    topics = llda_model_project.inference(document=document, iteration=100, times=10)
    sorted_topics = sorted(topics, key=lambda x: x[0])
    for j, (topic, prob) in enumerate(sorted_topics):
        project_matrix_test[i, j] = prob

project_matrix_test

array([[0.00541477, 0.00541477, 0.00541477, ..., 0.00541477, 0.00541477,
        0.06097033],
       [0.00551694, 0.00551694, 0.00551694, ..., 0.00551694, 0.00551694,
        0.04325279],
       [0.00562303, 0.00562303, 0.00562303, ..., 0.00562303, 0.00562303,
        0.02100765],
       ...,
       [0.00541477, 0.00541477, 0.00541477, ..., 0.00541477, 0.00541477,
        0.06652588],
       [0.00551694, 0.00551694, 0.00551694, ..., 0.00551694, 0.00551694,
        0.05457354],
       [0.00562303, 0.00562303, 0.00562303, ..., 0.00754611, 0.00562303,
        0.02293072]])

In [12]:
documents = [(pub[1], pub[2]) for pub in test_pub_data]
pub_matrix_test = np.zeros((len(documents), llda_model_pub.K))

for i, (document, _) in enumerate(documents):
    topics = llda_model_pub.inference(document=document, iteration=100, times=10)
    sorted_topics = sorted(topics, key=lambda x: x[0])
    for j, (topic, prob) in enumerate(sorted_topics):
        pub_matrix_test[i, j] = prob

pub_matrix_test

array([[0.00471609, 0.00471609, 0.00471609, ..., 0.00471609, 0.00471609,
        0.04342577],
       [0.00531632, 0.00531632, 0.00531632, ..., 0.00531632, 0.00531632,
        0.01804359],
       [0.00495589, 0.00495589, 0.00495589, ..., 0.00495589, 0.00495589,
        0.02021013],
       ...,
       [0.00487329, 0.00487329, 0.00487329, ..., 0.00487329, 0.00487329,
        0.01820663],
       [0.00643275, 0.0047934 , 0.0047934 , ..., 0.0047934 , 0.0047934 ,
        0.0195475 ],
       [0.00464123, 0.00464123, 0.00622853, ..., 0.00464123, 0.00464123,
        0.04273647]])

In [13]:
project_matrix = np.concatenate((llda_model_project.theta, project_matrix_test))
pub_matrix = np.concatenate((llda_model_pub.theta, pub_matrix_test))

distance_matrix = np.zeros((len(project_matrix), len(pub_matrix)))

for i in range(len(project_matrix)):
    for j in range(len(pub_matrix)):
        distance_matrix[i, j] = 1 - cosine_similarity([project_matrix[i]], [pub_matrix[j]])[0][0]

In [14]:
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
# create a dataframe with row indices as project ids and column indices as publication ids
# if publication is in project, then 1, else 0
# if publication date is before project start date, then 0, else 1
# ratio of intersection of organisations from project and publication to organisations from publication
# ratio of intersection of authors from project and publication to authors from publication

all_data = {**train_data, **test_data}
pub_data = []
for pro_id in all_data.keys():
    for pub_id in all_data[pro_id]['publications'].keys():
        pub_data.append((pub_id, all_data[pro_id]['publications'][pub_id]))

data_matrix = [[0.] * len(pub_data) for _ in range(len(all_data))]
for i, pro_id in enumerate(all_data.keys()):
    for j, pub_id in enumerate([pub[0] for pub in pub_data]):
        belongs = 1 if pub_id in all_data[pro_id]['publications'].keys() else 0
        distance = distance_matrix[i, j]
        data_matrix[i][j] = [belongs, distance]

df = pd.DataFrame(distance_matrix, index=all_data.keys(), columns=[pub[0] for pub in pub_data])
df.to_csv('distance_dim_title.csv')
df.head()

Unnamed: 0,10.3389/fmars.2023.1254461,10.1007/978-3-031-49133-7_8,10.1007/978-3-031-43619-2_15,10.1080/11663081.2023.2246863,10.1177/03057356231165327,10.1016/j.jconrel.2024.05.037,10.1007/s13346-024-01618-6,10.1002/smll.202303682,10.1371/journal.pone.0298895,10.1007/s00334-024-00992-y,10.1038/s41598-023-44445-4,10.1101/2023.09.15.557939,10.1016/j.jasrep.2023.104204,10.1016/j.palaeo.2023.111655,10.1007/jhep05(2024)154,10.1140/epjc/s10052-024-12711-y,10.1140/epjc/s10052-024-12416-2,10.1140/epjc/s10052-024-12415-3,10.1007/jhep02(2024)124,10.1007/jhep11(2023)103,10.1007/jhep06(2023)086,10.1093/iob/obad026,10.1007/s00359-023-01629-7,10.1101/2023.03.11.531676,10.1093/mnras/stae997,10.1093/mnras/stae616,10.1051/0004-6361/202348958,10.1093/mnras/stad3163,10.1093/mnras/stad2183,10.1101/2024.01.14.574481,10.1007/s40313-024-01095-9,10.1109/tpwrs.2023.3321700,10.1109/tits.2024.3392914,10.1007/978-981-97-0989-2_24,10.1109/tsc.2023.3332701,10.1007/978-3-031-48424-7_15,10.1007/978-3-031-48424-7_13,10.1145/3631353,10.1145/3629517,10.1109/icdcs57875.2023.00111,10.1109/icws60048.2023.00056,10.1109/icws60048.2023.00031,10.1109/icws60048.2023.00068,10.1109/tsc.2023.3307143,10.1145/3600232,10.1109/mic.2023.3267266,10.1109/tsc.2023.3241975,10.1109/tmc.2022.3230856,10.1007/978-3-031-20984-0_9,10.1109/tsc.2022.3160469,10.3389/fneur.2023.1182561,10.1038/s41598-024-57498-w,10.1016/j.jmrt.2023.11.014,10.1016/j.jmst.2023.05.020,10.1016/j.fuel.2023.130187,10.1017/9781009297349,10.1007/s11229-023-04282-4,10.3390/rel14060758,10.1002/smsc.202400096,10.1016/j.actpsy.2024.104252,10.1080/02691728.2024.2326828,10.5964/ejop.12031,10.1111/jopy.12805,10.1109/lsp.2023.3277792,10.21203/rs.3.rs-3644422/v1,10.1016/j.renene.2024.120101,10.1093/rheumatology/kead301,10.1097/mlr.0000000000002000,10.1111/tmi.13827,10.1063/5.0167167,10.1021/acsami.2c19376,10.1021/acsanm.2c05047,10.1101/2024.05.21.595254,10.1038/s41467-024-47964-4,10.1093/jb/mvae021,10.1016/j.neuron.2024.01.014,10.1016/j.isci.2023.107385,10.1016/j.peptides.2023.171051,10.3389/fphar.2023.1138666,10.3389/fphar.2023.1098976,10.1186/s43058-023-00521-4,10.1177/26334895231199467,10.1002/adom.202303199,10.1002/adom.202301232,10.1016/j.energy.2024.130322,10.1126/sciimmunol.abo4365,10.1515/sem-2023-0178,10.1364/boe.506664,10.1364/boe.494585,10.3847/1538-4357/ac4601,10.1371/journal.pone.0284416,10.1080/07350015.2023.2271039,10.1093/mnras/stae385,10.1093/mnras/stad2760,10.1002/ange.202320045,10.1002/anie.202320045,10.1016/j.chembiol.2024.02.012,10.1101/2023.11.29.569293,10.1038/s41467-023-41197-7,10.35772/ghm.2023.01065,10.3390/v15040896,10.1111/dar.13836,10.1063/5.0153862,10.1109/imoc57131.2023.10379741,10.1109/imoc57131.2023.10379729,10.1109/access.2023.3339563,10.1109/ojpel.2023.3339014,10.1109/csci58124.2022.00203,10.1016/j.ssci.2022.105967,10.1007/978-3-031-06015-1_8,10.1101/2023.01.19.524726,10.1007/s00382-023-07058-1,10.1002/oa.3284,10.1136/bmjopen-2023-080603,10.1101/2023.08.02.551649,10.1099/mgen.0.000965,10.2140/ant.2022.16.2005,10.1103/physrevlett.132.103402,10.21468/scipostphys.15.2.068,10.1080/02606755.2023.2213550,10.3390/rs15204928,10.1063/5.0203603,10.1103/physrevapplied.21.054027,10.1109/icecom58258.2023.10367924,10.1109/icecom58258.2023.10367934,10.1109/icecom58258.2023.10367938,10.1109/icecom58258.2023.10367923,10.1109/metamaterials58257.2023.10289546,10.23919/ursigass57860.2023.10265525,10.1109/elmar59410.2023.10253914,10.1002/pen.26771,10.1016/j.canep.2023.102451,10.3390/biomedicines11051344,10.3390/pharmaceutics15010181,10.1037/fam0001189,10.3390/su15129371,10.1038/s44221-024-00208-7,10.1093/evolut/qpae036,10.1093/evolut/qpae024,10.3390/micro4010008,10.3390/molecules28196822,10.1007/s11673-023-10285-0,10.1021/acsnano.3c09776,10.1101/2023.09.08.556607,10.1016/j.snb.2023.133733,10.1016/j.ocecoaman.2023.106961,10.1016/j.tre.2023.103169,10.1016/j.elerap.2023.101336,10.1590/0001-3765202320230351,10.1590/s1678-3921.pab2023.v58.03246,10.1038/s41598-024-56540-1,10.1364/ol.494369,10.1017/s0963180124000112,10.1136/jme-2023-109568,10.1111/japp.12655,10.1038/s41539-023-00170-1,10.1016/j.neubiorev.2023.105153,10.1007/s00158-023-03663-0,10.3390/ma16145076,10.1007/978-3-031-55260-1_15,10.1007/s11228-024-00719-1,10.1007/s00205-023-01948-8,10.1142/s0219199723500657,10.1007/s12220-023-01484-7,10.1007/s10957-023-02344-8,10.1007/978-3-031-46359-4_2,10.1007/s10208-023-09629-4,10.1007/s00245-023-10029-x,10.1007/s00028-023-00902-1,10.1016/j.jde.2023.06.004,10.1007/s00030-023-00857-9,10.1007/s11579-023-00333-z,10.1061/jmenea.meeng-5794,10.1177/21695067231194338,10.1038/s41597-024-03034-4,10.1039/d3ew00347g,10.1101/2024.05.17.24307550,10.1101/2024.01.09.24301073,10.1038/s41598-023-41853-4,10.1111/sjos.12685,10.1038/s41593-023-01321-8,10.1016/j.jclinepi.2023.02.020,10.1371/journal.pone.0280192,10.1016/j.jbi.2022.104243,10.1016/j.eclinm.2022.101724,10.38107/037,10.1002/adfm.202314696,10.1063/5.0168129,10.1103/physrevmaterials.7.064202,10.1038/s41699-023-00404-1,10.1061/jsendh.steng-12655,10.1186/s40623-023-01940-2,10.1029/2022ja031231,10.1029/2023ja031663,10.1029/2022gl101465,10.21203/rs.3.rs-4345687/v1,10.1093/toxsci/kfae021,10.1101/2023.08.28.555101,10.1103/physrevb.109.205125,10.1111/cgf.14942,10.1109/tpami.2022.3163720,10.1016/j.csl.2024.101623,10.1039/d0sc01737j,10.1186/s12889-023-17570-y,10.1080/13218719.2023.2243303,10.5694/mja2.52089,10.1177/00938548231170799,10.1007/s11150-024-09710-z,10.1016/j.jbankfin.2023.107047,10.1016/j.euroecorev.2023.104632,10.1038/s41598-023-30724-7,10.1038/s41598-023-29536-6,10.1111/obes.12545,10.1016/j.jebo.2022.11.027,10.3389/fimmu.2023.1060258,10.1016/j.jhydrol.2024.130983,10.1101/2024.03.18.585583,10.1016/j.celrep.2024.113675,10.1103/physrevx.14.021017,10.1038/s41559-024-02331-w,10.1016/j.gloplacha.2024.104354,10.1038/s41467-023-41685-w,10.1126/sciadv.adg7679,10.1144/sp532-2022-1,10.1523/jneurosci.0226-23.2023,10.1101/2023.01.11.523491,10.1073/pnas.2309379120,10.1073/pnas.2301947120,10.1038/s41467-024-48673-8,10.1038/s41467-024-47953-7,10.1016/j.fsigen.2024.103048,10.1093/bib/bbad163,10.1101/2023.12.12.570420,10.1016/j.celrep.2023.113331,10.1103/physrevd.108.105013,10.1007/jhep11(2023)005,10.1101/2024.01.29.574039,10.1126/scitranslmed.adi9711,10.3390/cancers15143723,10.1021/acsnano.3c11337,10.1038/s41467-023-36133-8,10.1016/j.cobme.2024.100547,10.1002/ange.202319567,10.1002/anie.202319567,10.1016/j.jfca.2023.105901,10.1016/j.foodcont.2023.109969,10.1016/j.respol.2024.104954,10.1371/journal.pbio.3002513,10.1109/qce57702.2023.00111,10.1109/iccad57390.2023.10323863,10.1016/j.ic.2023.105077,10.1145/3582016.3582039,10.1109/tcad.2022.3179223,10.1145/3517145,10.1016/j.tcs.2022.02.017,10.1145/3514355,10.1145/3514239,10.1038/s41598-024-51799-w,10.3390/cells12242815,10.5771/9783748935544,10.1016/j.eswa.2024.124100,10.1016/j.frl.2024.105308,10.12688/openreseurope.16436.1,10.12688/openreseurope.16278.1,10.12688/openreseurope.15386.1,10.3390/foods12244484,10.1057/s42984-024-00090-3,10.1002/anie.202315985,10.1002/ange.202315985,10.1161/atvbaha.123.319821,10.1093/cvr/cvad149,10.1161/strokeaha.123.042714,10.1016/j.jtha.2023.04.002,10.1182/bloodadvances.2023010100,10.3389/fphar.2024.1379236,10.1101/2023.07.03.547532,10.1103/physreve.107.l052602,10.1063/5.0133871,10.1109/icnwc57852.2023.10127328,10.1016/j.atech.2023.100265,10.1016/j.cct.2023.107387,10.1155/2023/2397564,10.1007/s10502-024-09441-1,10.1111/gcb.16637,10.3390/ma16051978,10.21203/rs.3.rs-4271873/v1,10.1038/s41419-024-06693-8,10.1038/s41598-024-56928-z,10.1016/j.chemgeo.2024.122157,10.1016/j.chemgeo.2022.121064,10.2343/geochemj.gj22004,10.1016/j.jwpe.2023.104395,10.1016/j.jece.2023.111107,10.1080/02614367.2022.2162109,10.1109/twc.2024.3400601,10.1109/globecom54140.2023.10437972,10.1109/twc.2023.3344802,10.1109/tifs.2023.3268443,10.1093/ptep/ptae021,10.1021/accountsmr.4c00071,10.26434/chemrxiv-2024-hvxml,10.1039/d4nr01024h,10.1038/s42004-024-01143-0,10.1039/d3dd00236e,10.1039/d3tc03606e,10.1021/acs.chemmater.3c01744,10.1021/acs.inorgchem.3c02337,10.1063/5.0144827,10.1002/anie.202314378,10.1002/ange.202314378,10.1039/d3ta04707e,10.1039/d3ce00881a,10.1002/asia.202300673,10.1038/s41467-023-38737-6,10.26434/chemrxiv-2023-d1s8w,10.1002/adma.202211478,10.1145/3589334.3645329,10.1029/2023gl104396,10.20396/cel.v65i00.8673331,10.1016/j.procs.2023.08.230,10.1371/journal.pbio.3001984,10.1101/2022.04.22.489138,10.1002/brb3.3490,10.1016/j.clinph.2024.04.002,10.1111/ejn.16001,10.3389/fneur.2023.1177589,10.1016/j.clinph.2022.08.015,10.1101/2024.05.23.24307833,10.1093/ofid/ofad655,10.1093/ofid/ofae018,10.1371/journal.pone.0297775,10.21203/rs.3.rs-2640564/v3,10.1002/saj2.20688,10.1071/sr23164,10.1029/2023gl104852,10.1038/s41598-022-10957-8,10.1186/s40623-022-01584-8,10.1111/nph.19336,10.3389/fpsyg.2022.1014713,10.3390/v15102029,10.3389/fnut.2023.1215768,10.3390/educsci13080838,10.12688/routledgeopenres.17798.2,10.12688/routledgeopenres.17798.1,10.1080/00031305.2023.2232006,10.1080/0969725x.2023.2270357,10.1177/00345237231183343,10.1016/j.ijheatmasstransfer.2023.124665,10.1039/d3qm01106b,10.1016/j.mechmachtheory.2023.105508,10.1016/j.scib.2024.02.010,10.1088/1674-4527/ace179,10.1126/science.abl7759,10.1016/j.scitotenv.2024.172840,10.1016/j.envint.2024.108601,10.1016/j.envint.2024.108454,10.1016/j.envint.2023.108375,10.1016/j.envres.2023.117611,10.1016/j.envres.2023.117832,10.2337/dc23-0327,10.1021/acs.est.3c02765,10.1021/acs.est.3c00848,10.1007/s40726-023-00269-4,10.1021/acs.analchem.3c00376,10.1289/ehp11372,10.1101/2023.02.09.527886,10.3390/make6020035,10.1016/j.micromeso.2024.113042,10.3390/make6010014,10.1016/j.compag.2024.108650,10.1038/s41598-023-34320-7,10.1016/j.compag.2022.107325,10.1145/3615894.3628507,10.1016/j.scs.2023.104435,10.1093/jipm/pmac028,10.1145/3651171,10.1016/j.clsr.2024.105934,10.1145/3594739.3605113,10.1093/lambio/ovae041,10.1007/s12155-024-10734-7,10.1016/j.carres.2024.109068,10.1007/s00253-023-12908-3,10.1007/s00289-024-05152-w,10.3390/polysaccharides4020013,10.3389/fagro.2023.1148969,10.1038/s41586-024-07473-2,10.1101/2023.11.30.569198,10.1186/s13015-024-00254-6,10.1007/978-1-0716-3989-4_3,10.4230/lipics.wabi.2023.17,10.1186/s13015-024-00261-7,10.1101/2023.11.22.568259,10.1093/gbe/evad205,10.1101/gr.277679.123,10.1101/2023.06.21.545862,10.1145/3571723,10.1101/2023.05.12.540616,10.1101/2023.03.02.530874,10.1101/2023.01.30.526175,10.1101/2022.12.23.521809,10.1038/s41390-023-02992-6,10.1001/jama.2023.20358,10.1542/hpeds.2023-007246,10.1016/j.jpeds.2023.113499,10.1093/jamia/ocad053,10.1093/jamia/ocac251,10.1038/s41598-024-54655-z,10.1172/jci175031,10.3389/fgene.2023.1304425,10.1186/s13578-023-01102-7,10.1016/j.gendis.2022.11.003,10.1002/mp.16880,10.1002/mp.16352,10.1016/j.scitotenv.2022.158267,10.1016/j.foreco.2022.120301,10.1016/j.ecolind.2022.109004,10.1073/pnas.2318333121,10.1063/5.0158930,10.1145/3588432.3591521,10.1063/5.0142166,10.1038/s41467-024-46494-3,10.1128/mbio.02479-23,10.1101/2023.09.08.556855,10.1101/2023.08.31.555785,10.1186/s40168-022-01378-w,10.1101/2023.12.18.572279,10.1093/nar/gkad1164,10.1101/2023.12.03.569795,10.1101/2023.07.26.550759,10.1186/s12864-023-09265-w,10.1021/acsanm.3c05701,10.1016/j.apsusc.2023.158316,10.1080/03057240.2024.2333577,10.3390/rel14121517,10.3390/rel14111427,10.1109/icops45740.2023.10480948,10.1109/icops45740.2023.10481052,10.1109/icops45740.2023.10481130,10.1038/s41598-024-51298-y,10.1109/ppc47928.2023.10311041,10.1109/ppc47928.2023.10310918,10.1049/hve2.12382,10.21203/rs.3.rs-3143506/v1,10.4271/03-16-08-0061,10.1080/02560046.2024.2316302,10.1177/01634437231219141,10.1177/16094069231182015,10.1177/00113921231182182,10.1002/cjce.25286,10.1080/07373937.2024.2318437,10.1016/j.etap.2024.104382,10.1080/19440049.2023.2283769,10.3390/ani13152499,10.1016/j.jet.2024.105798,10.1038/s41467-023-41107-x,10.1016/j.oneear.2023.05.006,10.1088/1748-9326/acd5e8,10.1088/1748-9326/aca815,10.1145/3617232.3624856,10.1109/cloudcom59040.2023.00047,10.1007/s11761-024-00391-1,10.1109/percomworkshops56833.2023.10150370,10.1016/j.comcom.2023.04.027,10.1109/apsec57359.2022.00034,10.1109/cloudcom55334.2022.00016,10.1371/journal.pone.0285434,10.1186/s13578-023-01012-8,10.1161/strokeaha.122.041651,10.1080/15534510.2023.2279662,10.1111/nana.12994,10.1080/14680777.2023.2258298,10.1038/s41598-023-35252-y,10.1177/10596011231193176,10.1016/j.jhin.2023.03.002,10.1177/10596011221150756,10.1080/08039488.2024.2322495,10.1007/s00787-024-02406-w,10.1142/s0219877024500275,10.1155/2023/2516746,10.1080/08039488.2023.2222698,10.3389/fpsyg.2023.1183704,10.1111/acer.15119,10.1080/20008066.2023.2191396,10.1007/s00787-022-02107-2,10.1007/s11218-022-09734-2,10.1016/j.rssm.2023.100876,10.3390/f15020354,10.1007/s11629-023-8914-3,10.14746/quageo-2023-0016,10.18146/view.297,10.18146/tmg.835,10.5117/9789463727815,10.1177/08912424231163485,10.1007/978-94-6265-515-7,10.1038/s41467-023-41057-4,10.1093/gigascience/giad047,10.1038/s41592-023-01886-z,10.1093/nar/gkad289,10.1101/2023.01.21.525030,10.1016/j.gpb.2022.09.011,10.1021/acs.jpcb.4c01987,10.1021/acs.jctc.3c00663,10.1021/acs.jpcb.3c04473,10.26434/chemrxiv-2023-w0h1p,10.1073/pnas.2305899120,10.1101/2023.05.01.538927,10.1101/2023.12.22.23300430,10.1002/agt2.386,10.1002/adfm.202214179,10.1109/milcom58377.2023.10356332,10.1101/2024.05.03.24306699,10.1101/2024.04.16.24305925,10.1101/2023.10.25.23297571,10.3389/fphys.2023.1202186,10.1103/physrevb.109.205301,10.1103/physrevb.108.195303,10.1523/eneuro.0197-23.2023,10.3390/v15091897,10.1016/j.prdoa.2024.100251,10.3390/ijms24108995,10.3390/ijms24032247,10.1016/j.isci.2023.108171,10.1158/2326-6066.cir-23-0496,10.1101/2023.12.07.570715,10.1016/j.cell.2023.11.008,10.1093/abt/tbad025,10.1016/j.celrep.2023.113280,10.1101/2023.06.18.545488,10.3390/cancers15102788,10.1101/2023.03.07.531525,10.1080/13543784.2023.2179482,10.1016/j.bbrc.2022.09.019,10.3389/fimmu.2022.996026,10.1111/liv.15927,10.1101/2023.11.17.23298672,10.1111/liv.15665,10.1016/j.cgh.2023.04.016,10.1016/j.jhepr.2022.100667,10.1007/s11914-023-00843-1,10.1007/s11914-023-00842-2,10.1007/s11914-023-00855-x,10.3390/rs15235545,10.1029/2022gl102689,10.3390/rs14236069,10.1038/s41467-024-46327-3,10.1002/cam4.6761,10.3389/fonc.2023.1100585,10.1109/vtc2023-fall60731.2023.10333522,10.1128/jvi.00100-23,10.1021/acs.jpcc.3c05477,10.1021/acsaem.3c01370,10.3389/fnins.2023.1217993,10.1016/j.visres.2023.108296,10.1016/j.jad.2023.07.014,10.1001/jamanetworkopen.2023.17905,10.1007/s00371-024-03454-8,10.1109/smc53992.2023.10394105,10.1007/s00521-023-09367-2,10.1145/3582700.3582707,10.1007/s10803-024-06302-9,10.1016/j.psychres.2024.115838,10.1016/j.rasd.2024.102339,10.1177/13623613231213543,10.1007/s10803-023-06039-x,10.1016/j.jplph.2023.154138,10.1016/j.freeradbiomed.2024.04.217,10.1016/j.freeradbiomed.2023.06.021,10.1093/jncimonographs/lgad014,10.1038/s41467-023-37269-3,10.1111/liv.15893,10.1101/2023.04.25.538102,10.1063/5.0142200,10.1016/b978-0-323-95124-1.00017-6,10.1101/2023.05.17.541187,10.1101/2023.05.17.541174,10.1007/s00415-024-12430-0,10.1093/ntr/ntae084,10.1093/schbul/sbae024,10.1038/s41386-024-01842-1,10.21203/rs.3.rs-3168186/v1,10.1101/2023.08.21.23294348,10.1038/s41380-023-02165-1,10.1136/bmjopen-2022-066249,10.1038/s41585-024-00869-9,10.1158/0008-5472.can-23-0555,10.1101/2022.11.02.514910,10.3390/s24072335,10.1109/sensors56945.2023.10324963,10.1038/s41528-023-00258-z,10.3390/bios12050322,10.1371/journal.pone.0288803,10.3389/fpubh.2023.1219676,10.1016/j.soard.2023.09.026,10.3389/fpsyg.2023.1106571,10.2196/46415,10.1101/2023.04.20.23288698,10.1111/joes.12620,10.1101/2024.04.22.24306094,10.1007/s00401-024-02721-1,10.1101/2024.02.28.582621,10.1016/j.neuron.2024.01.008,10.1002/alz.13576,10.1001/jamaneurol.2023.3599,10.1186/s40478-023-01626-6,10.1111/acel.13938,10.1101/2023.07.20.23292771,10.1101/2023.07.06.23292312,10.1101/2023.04.21.23288938,10.1186/s13024-022-00590-4,10.1186/s13058-024-01777-x,10.1117/1.jmi.10.5.054503,10.1002/mp.17040,10.1016/j.brat.2024.104494,10.1176/appi.ajp.20230272,10.1001/jamapsychiatry.2023.5138,10.1016/j.addbeh.2023.107911,10.1016/j.explore.2023.11.001,10.1038/s44220-023-00084-2,10.1007/s40429-023-00501-7,10.1016/j.drugalcdep.2023.109890,10.1145/3631461.3631550,10.1016/j.jcss.2023.02.004,10.1080/15384101.2021.2023304,10.3390/ijms241713272,10.1016/j.jval.2024.01.020,10.1038/s41366-023-01396-0,10.1021/acs.jpcc.3c04680,10.1021/acs.jpcc.4c01814,10.4025/actascilangcult.v45i2.67723,10.1007/s10915-023-02353-9,10.1007/s42967-023-00287-5,10.1007/s10543-023-00954-2,10.1128/jvi.00398-22,10.1093/genetics/iyad216,10.1101/2023.10.17.562696
9852805,0.640208,0.868607,0.827553,0.607245,0.891885,0.759265,0.699039,0.59872,0.632743,0.718642,0.863429,0.677742,0.791593,0.767135,0.812592,0.754923,0.615832,0.57179,0.811416,0.681292,0.873749,0.604014,0.702269,0.646478,0.816364,0.843998,0.753721,0.743177,0.765359,0.92047,0.636948,0.712922,0.788715,0.724764,0.743177,0.818859,0.978845,0.805778,0.596194,0.743177,0.819322,0.93725,0.978845,0.969027,0.788715,0.978845,0.978644,0.646041,0.920532,0.978845,0.698691,0.628137,0.732315,0.819778,0.67785,0.843998,0.894805,0.900348,0.969027,0.754815,0.677742,0.909332,0.636948,0.891885,0.693001,0.753709,0.768958,0.831824,0.677742,0.879914,0.92047,0.696558,0.732315,0.733792,0.651222,0.864168,0.854686,0.788715,0.849756,0.724511,0.581588,0.878707,0.865337,0.72263,0.631157,0.861146,0.791593,0.900998,0.788715,0.709741,0.739586,0.786077,0.775578,0.83807,0.70665,0.70665,0.812467,0.648089,0.702269,0.841743,0.613028,0.92631,0.891885,0.739586,0.631351,0.692603,0.717758,0.613453,0.702269,0.759265,0.702269,0.793828,0.677742,0.947678,0.788715,0.897695,0.865242,0.705209,0.732315,0.724511,0.628336,0.702269,0.548603,0.776987,0.623513,0.677916,0.544411,0.785306,0.677742,0.586266,0.72462,0.573996,0.677742,0.694594,0.813578,0.661728,0.762282,0.66117,0.532873,0.780835,0.878567,0.843998,0.940108,0.936501,0.735027,0.922528,0.831824,0.863746,0.631157,0.603984,0.743366,0.861197,0.788715,0.987063,0.98394,0.900922,0.782274,0.767799,0.812467,0.677742,0.754923,0.915078,0.626977,0.913643,0.739586,0.743177,0.863329,0.759265,0.759265,0.744466,0.791593,0.657768,0.544749,0.58463,0.741512,0.813505,0.826609,0.930677,0.601892,0.641477,0.641477,0.677742,0.714073,0.843998,0.778165,0.748691,0.752131,0.655452,0.646041,0.929861,0.847797,0.788715,0.730252,0.900922,0.981496,0.615832,0.569736,0.764257,0.827553,0.615719,0.654953,0.677742,0.930223,0.961635,0.779463,0.824579,0.682536,0.759265,0.701651,0.560734,0.718642,0.806595,0.909332,0.74464,0.72263,0.641477,0.900922,0.890843,0.762282,0.736504,0.710486,0.706056,0.917338,0.631351,0.544332,0.544332,0.818859,0.868607,0.791593,0.79166,0.732456,0.636948,0.982518,0.641477,0.70665,0.908404,0.841743,0.929818,0.788715,0.759793,0.736877,0.818859,0.844146,0.940276,0.718642,0.807331,0.732315,0.705073,0.978667,0.890843,0.92066,0.970461,0.785306,0.974897,0.978845,0.831824,0.863329,0.788715,0.92047,0.743177,0.694594,0.790498,0.768958,0.904284,0.868607,0.646041,0.788715,0.880831,0.880831,0.677742,0.631157,0.615832,0.955897,0.806595,0.623513,0.712922,0.740981,0.843998,0.847797,0.824579,0.792576,0.826264,0.98395,0.604014,0.741575,0.788715,0.788715,0.579661,0.70665,0.846824,0.724997,0.79166,0.650057,0.664794,0.697765,0.842686,0.756904,0.816493,0.694594,0.548603,0.560734,0.601892,0.826246,0.646041,0.570425,0.595266,0.654953,0.759265,0.730252,0.730252,0.743177,0.702269,0.839156,0.639855,0.623513,0.763062,0.915153,0.754923,0.983999,0.897292,0.739954,0.739954,0.681018,0.677742,0.79166,0.730609,0.806595,0.618415,0.651222,0.659965,0.631318,0.648714,0.872475,0.681018,0.890894,0.788715,0.791593,0.018627,0.730135,0.782755,0.92047,0.654953,0.777209,0.777209,0.863329,0.928888,0.878567,0.718642,0.628237,0.727906,0.649122,0.739282,0.775578,0.617915,0.544387,0.613398,0.710208,0.733234,0.813812,0.636948,0.729277,0.641477,0.570802,0.716725,0.54611,0.716725,0.560734,0.61715,0.557524,0.646041,0.615832,0.565234,0.790498,0.831914,0.677742,0.790498,0.679681,0.818859,0.600438,0.718642,0.661728,0.607245,0.718642,0.909332,0.587332,0.763314,0.698828,0.638384,0.950931,0.919722,0.974859,0.929818,0.937517,0.831824,0.969027,0.879233,0.638384,0.886588,0.677742,0.93725,0.702269,0.743177,0.863429,0.774453,0.66438,0.636948,0.631545,0.768958,0.83807,0.774453,0.706835,0.641587,0.714073,0.812592,0.730252,0.649684,0.607245,0.658832,0.739586,0.562475,0.555158,0.551251,0.551251,0.607245,0.778165,0.791593,0.790498,0.872436,0.790498,0.744466,0.791593,0.746977,0.646041,0.677742,0.868886,0.573996,0.555158,0.654953,0.628137,0.677742,0.677742,0.677987,0.628137,0.921654,0.754815,0.7906,0.72462,0.732315,0.909332,0.890843,0.677916,0.696558,0.751582,0.677742,0.724511,0.925138,0.638384,0.808886,0.863329,0.969098,0.890843,0.681292,0.786459,0.62091,0.651662,0.659965,0.8592,0.820655,0.754923,0.679289,0.695912,0.808886,0.730958,0.677742,0.61715,0.642405,0.643927,0.622637,0.637784,0.890843,0.934447,0.85095,0.661728,0.689628,0.641587,0.702269,0.610687,0.607245,0.737968,0.74513,0.943219,0.950275,0.878707,0.710883,0.808964,0.595266,0.626977,0.754815,0.818859,0.743366,0.632663,0.693001,0.939433,0.818859,0.712922,0.646041,0.919853,0.901869,0.912481,0.905058,0.914092,0.951696,0.917383,0.921549,0.870803,0.890127,0.851758,0.901937,0.894605,0.893955,0.898243,0.895805,0.899082,0.912301,0.901168,0.901321,0.902122,0.907754,0.899022,0.90131,0.804107,0.934052,0.899003,0.896823,0.901695,0.924577,0.89506,0.891748,0.840864,0.926099,0.942874,0.894027,0.906809,0.89506,0.910916,0.916762,0.888939,0.896173,0.901274,0.897778,0.914933,0.899856,0.890884,0.923368,0.897018,0.901179,0.894591,0.893129,0.933555,0.914301,0.909832,0.911852,0.923505,0.940082,0.901454,0.903654,0.902393,0.895621,0.841629,0.896446,0.901788,0.899434,0.905471,0.841036,0.866529,0.918414,0.918773,0.910064,0.928066,0.910391,0.924686,0.949512,0.934919,0.938898,0.907398,0.910603,0.897965,0.895103,0.889734,0.896932,0.920745,0.919992,0.923713,0.915982,0.909444,0.924483,0.913505,0.911115,0.90939,0.923804,0.905598,0.866832,0.908278,0.915492,0.923019,0.906769,0.923668,0.908737,0.901637,0.91599,0.91703,0.900307,0.904531,0.91743,0.908221,0.912756,0.944328,0.916549,0.910515,0.94445,0.871016,0.881765,0.895398,0.904232,0.934626,0.967343,0.837607,0.902339,0.887695,0.896261,0.862315,0.899377,0.911182,0.91388,0.922188
13062422,0.653853,0.771239,0.7714,0.316196,0.811767,0.580869,0.476012,0.301353,0.360589,0.510143,0.762224,0.438934,0.637155,0.594571,0.673715,0.573311,0.331146,0.254467,0.671666,0.445116,0.780192,0.573122,0.481638,0.667261,0.680281,0.728393,0.573311,0.55286,0.602118,0.861535,0.367911,0.500184,0.632143,0.596926,0.55286,0.684624,0.963169,0.661851,0.296956,0.55286,0.685432,0.890749,0.963169,0.946074,0.632143,0.963169,0.962818,0.383742,0.861643,0.963169,0.475408,0.352569,0.533948,0.686225,0.439122,0.728393,0.81685,0.826502,0.946074,0.573122,0.438934,0.842143,0.367911,0.811767,0.465501,0.681147,0.597745,0.707198,0.438934,0.790925,0.861535,0.471694,0.533948,0.536519,0.392761,0.763511,0.747001,0.632143,0.738418,0.520361,0.271526,0.788823,0.765546,0.517086,0.357827,0.758248,0.637155,0.827633,0.632143,0.55286,0.546608,0.62755,0.673497,0.718073,0.489264,0.489264,0.673497,0.387306,0.481638,0.724467,0.326264,0.933175,0.811767,0.546608,0.358165,0.464807,0.508604,0.327005,0.481638,0.580869,0.481638,0.641046,0.438934,0.882113,0.632143,0.821882,0.76538,0.486755,0.533948,0.520361,0.352917,0.481638,0.214098,0.611724,0.344519,0.439237,0.206799,0.626208,0.438934,0.27967,0.52055,0.258308,0.438934,0.468275,0.67543,0.411053,0.586122,0.525864,0.382122,0.618425,0.788579,0.728393,0.895725,0.889445,0.53867,0.929746,0.707198,0.728032,0.357827,0.310518,0.553189,0.758337,0.632143,0.977476,0.972039,0.8275,0.681147,0.928052,0.673497,0.438934,0.573311,0.852146,0.35055,0.849649,0.546608,0.55286,0.76205,0.580869,0.580869,0.555104,0.637155,0.404158,0.207388,0.276822,0.549961,0.675304,0.698118,0.879306,0.306876,0.375796,0.375796,0.438934,0.502187,0.728393,0.613775,0.543917,0.568448,0.400126,0.383742,0.877885,0.735007,0.632143,0.530356,0.8275,0.967783,0.331146,0.250891,0.589561,0.7714,0.330949,0.399258,0.438934,0.842786,0.933205,0.616035,0.694584,0.44728,0.580869,0.48056,0.235218,0.510143,0.663273,0.842143,0.555406,0.517086,0.375796,0.8275,0.809952,0.586122,0.553189,0.495943,0.501559,0.867821,0.358165,0.206661,0.206661,0.684624,0.771239,0.637155,0.63727,0.534194,0.367911,0.969563,0.375796,0.489264,0.840527,0.724467,0.877811,0.632143,0.581789,0.541892,0.684624,0.728652,0.94584,0.510143,0.664555,0.533948,0.547656,0.962859,0.809952,0.928052,0.948571,0.626208,0.956295,0.963169,0.707198,0.76205,0.632143,0.861535,0.55286,0.468275,0.635247,0.597745,0.833354,0.771239,0.383742,0.632143,0.792522,0.792522,0.438934,0.357827,0.331146,0.923215,0.663273,0.344519,0.500184,0.620676,0.728393,0.735007,0.694584,0.638865,0.697519,0.972056,0.573122,0.60364,0.632143,0.632143,0.26817,0.489264,0.733314,0.521207,0.63727,0.390733,0.41639,0.473795,0.726109,0.576759,0.680507,0.468275,0.214098,0.235218,0.306876,0.769668,0.383742,0.25209,0.29534,0.399258,0.580869,0.530356,0.530356,0.55286,0.481638,0.719964,0.372971,0.344519,0.58748,0.852277,0.573311,0.972142,0.90686,0.547248,0.547248,0.444639,0.438934,0.63727,0.530979,0.663273,0.335643,0.392761,0.407984,0.358108,0.388395,0.777974,0.444639,0.810041,0.632143,0.637155,0.632765,0.4305,0.621767,0.861535,0.399258,0.612111,0.612111,0.76205,0.876191,0.788579,0.510143,0.352743,0.526272,0.438934,0.607312,0.673497,0.334772,0.206757,0.326909,0.495459,0.579769,0.675838,0.367911,0.528659,0.375796,0.252747,0.506805,0.209757,0.506805,0.235218,0.33344,0.229629,0.383742,0.331146,0.243052,0.635247,0.707355,0.438934,0.635247,0.44231,0.684624,0.304345,0.510143,0.411053,0.316196,0.510143,0.842143,0.281526,0.587919,0.475646,0.37041,0.955502,0.927201,0.956229,0.877811,0.891214,0.707198,0.946074,0.921534,0.37041,0.802544,0.438934,0.890749,0.481638,0.55286,0.762224,0.607312,0.41567,0.367911,0.358502,0.597745,0.718073,0.607312,0.489587,0.375987,0.502187,0.673715,0.530356,0.399535,0.316196,0.462566,0.546608,0.238249,0.225511,0.218708,0.218708,0.316196,0.613775,0.637155,0.635247,0.777905,0.635247,0.555104,0.637155,0.559475,0.383742,0.438934,0.771724,0.258308,0.225511,0.399258,0.352569,0.438934,0.438934,0.439362,0.352569,0.863597,0.573122,0.635425,0.52055,0.533948,0.842143,0.809952,0.439237,0.471694,0.567493,0.438934,0.520361,0.932112,0.37041,0.667261,0.76205,0.946198,0.809952,0.445116,0.628216,0.339987,0.393527,0.407984,0.754861,0.687752,0.573311,0.441628,0.470569,0.667261,0.531585,0.438934,0.33344,0.37741,0.380061,0.342993,0.369365,0.809952,0.940554,0.740498,0.411053,0.459629,0.375987,0.481638,0.331441,0.316196,0.543791,0.556259,0.901142,0.913427,0.788823,0.496634,0.667397,0.29534,0.35055,0.573122,0.684624,0.553189,0.36045,0.465501,0.945075,0.684624,0.500184,0.383742,0.92732,0.911011,0.885289,0.913903,0.922095,0.956196,0.957901,0.928858,0.915428,0.901247,0.914809,0.897872,0.904424,0.903835,0.899949,0.906351,0.909296,0.920472,0.910376,0.910514,0.91124,0.879092,0.908429,0.910504,0.870405,0.931318,0.911899,0.893499,0.884385,0.901143,0.904837,0.902704,0.918499,0.932984,0.943832,0.9039,0.915491,0.904837,0.919215,0.902105,0.899285,0.905846,0.870599,0.907301,0.922858,0.909186,0.901927,0.933153,0.921698,0.883779,0.904412,0.859923,0.921855,0.922285,0.918233,0.920064,0.910036,0.945664,0.911428,0.913405,0.899248,0.905346,0.918891,0.906093,0.910937,0.895265,0.917541,0.909162,0.900524,0.928831,0.93824,0.906335,0.934768,0.941342,0.901285,0.955021,0.854669,0.944591,0.908022,0.919651,0.894678,0.862511,0.900007,0.906534,0.89612,0.905904,0.93082,0.923809,0.905689,0.931518,0.921563,0.919395,0.917832,0.900129,0.914392,0.847316,0.916823,0.923365,0.930191,0.915455,0.920504,0.917239,0.910801,0.923817,0.90242,0.909595,0.913425,0.914007,0.916771,0.923895,0.949514,0.924324,0.921941,0.950943,0.901927,0.89278,0.905143,0.887368,0.940716,0.970386,0.916831,0.89829,0.898158,0.909507,0.802508,0.882709,0.919456,0.922597,0.930063
13528070,0.97042,0.980451,0.91142,0.941565,0.016937,0.964183,0.955222,0.940297,0.945359,0.958139,0.979681,0.952054,0.968993,0.965354,0.972117,0.963537,0.942843,0.93629,0.971942,0.952582,0.981216,0.963521,0.955703,0.971566,0.972678,0.97679,0.963537,0.961789,0.965999,0.988167,0.945985,0.957288,0.968565,0.905874,0.961789,0.973049,0.996853,0.971103,0.939921,0.961789,0.973118,0.990664,0.996853,0.995392,0.968565,0.996853,0.996823,0.947337,0.988177,0.996853,0.955171,0.944674,0.960173,0.973186,0.95207,0.97679,0.984349,0.985174,0.995392,0.963521,0.952054,0.98651,0.945985,0.983915,0.954324,0.925542,0.965625,0.974978,0.952054,0.982133,0.988167,0.954853,0.960173,0.960393,0.948108,0.979791,0.97838,0.968565,0.977646,0.959012,0.937748,0.981954,0.979965,0.958732,0.945123,0.979341,0.968993,0.98527,0.968565,0.961789,0.961255,0.968172,0.972099,0.975908,0.956355,0.956355,0.972099,0.947642,0.955703,0.976454,0.942426,0.946095,0.983915,0.961255,0.945152,0.954265,0.958008,0.942489,0.955703,0.964183,0.955703,0.969325,0.952054,0.961726,0.968565,0.984779,0.97995,0.956141,0.960173,0.959012,0.944703,0.955703,0.93284,0.96682,0.943986,0.95208,0.932217,0.968057,0.952054,0.938444,0.959028,0.936618,0.952054,0.954561,0.972264,0.949671,0.964632,0.959483,0.947199,0.967392,0.981933,0.97679,0.991089,0.990553,0.960577,0.943329,0.974978,0.641394,0.945123,0.94108,0.961818,0.979349,0.968565,0.998075,0.997611,0.985259,0.925542,0.941962,0.972099,0.952054,0.963537,0.987365,0.944501,0.987152,0.961255,0.961789,0.979666,0.964183,0.964183,0.961981,0.968993,0.949082,0.932267,0.938201,0.961542,0.972253,0.974203,0.989686,0.940769,0.946658,0.946658,0.952054,0.957459,0.97679,0.966995,0.96261,0.963122,0.948738,0.947337,0.989565,0.977355,0.968565,0.959866,0.985259,0.997247,0.942843,0.935985,0.964926,0.924301,0.942826,0.948663,0.952054,0.948957,0.994292,0.967188,0.973901,0.952767,0.964183,0.955611,0.934645,0.958139,0.971225,0.98651,0.962007,0.958732,0.946658,0.985259,0.983759,0.964632,0.961818,0.956926,0.957406,0.988705,0.945152,0.932205,0.932205,0.973049,0.980451,0.968993,0.969003,0.960194,0.945985,0.997399,0.946658,0.956355,0.986372,0.976454,0.989558,0.968565,0.964262,0.960852,0.973049,0.976812,0.956311,0.958139,0.971334,0.960173,0.913414,0.996826,0.983759,0.941962,0.995605,0.968057,0.996265,0.996853,0.974978,0.979666,0.968565,0.988167,0.961789,0.954561,0.96883,0.965625,0.985759,0.980451,0.947337,0.968565,0.98227,0.98227,0.952054,0.945123,0.942843,0.993438,0.971225,0.943986,0.957288,0.91142,0.97679,0.977355,0.973901,0.969139,0.974151,0.997612,0.963521,0.92413,0.968565,0.968565,0.937461,0.956355,0.97721,0.959085,0.969003,0.947935,0.950127,0.955033,0.976595,0.963832,0.972698,0.954561,0.93284,0.934645,0.940769,0.923727,0.947337,0.936087,0.939783,0.948663,0.964183,0.959866,0.959866,0.961789,0.955703,0.976069,0.946417,0.943986,0.964748,0.987376,0.963537,0.997619,0.924868,0.96131,0.96131,0.952541,0.952054,0.969003,0.95992,0.971225,0.943227,0.948108,0.949409,0.945147,0.947735,0.981027,0.952541,0.983767,0.968565,0.968993,0.968618,0.810527,0.967678,0.988167,0.948663,0.966853,0.966853,0.979666,0.98942,0.981933,0.958139,0.944688,0.959517,0.952054,0.966443,0.972099,0.943153,0.932213,0.942481,0.956884,0.92942,0.972299,0.945985,0.959721,0.946658,0.936143,0.957854,0.93247,0.957854,0.934645,0.943039,0.934168,0.947337,0.942843,0.935315,0.96883,0.974992,0.952054,0.96883,0.952342,0.973049,0.940553,0.958139,0.949671,0.941565,0.958139,0.98651,0.938603,0.964785,0.955191,0.946198,0.964106,0.941276,0.99626,0.989558,0.990704,0.974978,0.995392,0.936705,0.946198,0.983126,0.952054,0.990664,0.955703,0.961789,0.979681,0.966443,0.950066,0.945985,0.945181,0.965625,0.975908,0.966443,0.956383,0.946675,0.957459,0.972117,0.959866,0.948687,0.941565,0.909735,0.961255,0.934904,0.933816,0.933234,0.933234,0.941565,0.966995,0.968993,0.96883,0.981021,0.96883,0.961981,0.968993,0.962355,0.947337,0.952054,0.980493,0.936618,0.933816,0.948663,0.944674,0.952054,0.952054,0.95209,0.944674,0.988344,0.963521,0.968845,0.905034,0.960173,0.98651,0.983759,0.95208,0.954853,0.96304,0.952054,0.959012,0.945238,0.946198,0.971566,0.979666,0.995402,0.983759,0.952582,0.968229,0.943598,0.948174,0.949409,0.979052,0.973317,0.963537,0.952284,0.954757,0.971566,0.959971,0.952054,0.943039,0.946796,0.947023,0.943855,0.946109,0.983759,0.807714,0.977824,0.949671,0.953822,0.946675,0.955703,0.942868,0.941565,0.961015,0.96208,0.991552,0.992602,0.981954,0.956985,0.971577,0.939783,0.944501,0.963521,0.973049,0.961818,0.945347,0.954324,0.955694,0.973049,0.957288,0.947337,0.922523,0.928216,0.935979,0.929125,0.935869,0.954029,0.963255,0.940259,0.931779,0.92034,0.928462,0.926796,0.922903,0.922427,0.910641,0.91981,0.926833,0.935847,0.927704,0.927815,0.926933,0.932521,0.926134,0.927807,0.939998,0.94978,0.928932,0.925195,0.926614,0.944828,0.920088,0.921515,0.934257,0.944833,0.96126,0.92248,0.929034,0.923236,0.91522,0.939111,0.918757,0.92405,0.927781,0.925224,0.935221,0.926744,0.920889,0.94276,0.936837,0.927712,0.922892,0.92022,0.951395,0.936025,0.934042,0.935519,0.944043,0.956169,0.928552,0.888097,0.929233,0.923646,0.895186,0.924249,0.928157,0.926435,0.933484,0.926725,0.938127,0.942591,0.95018,0.914409,0.94738,0.952683,0.924936,0.952797,0.938303,0.955304,0.935396,0.935186,0.926023,0.923267,0.91934,0.901911,0.942024,0.940273,0.944195,0.93854,0.933757,0.944759,0.936728,0.934979,0.932359,0.944262,0.930944,0.924886,0.932905,0.938182,0.943687,0.931801,0.943018,0.93324,0.928047,0.922165,0.939306,0.927073,0.930163,0.935884,0.912655,0.938609,0.95844,0.938955,0.937032,0.948516,0.920889,0.91351,0.923483,0.929944,0.951198,0.968431,0.932911,0.907057,0.917848,0.927002,0.922338,0.927046,0.935029,0.937562,0.943585
13057717,0.75257,0.166857,0.797752,0.511209,0.865449,0.331003,0.298758,0.474505,0.542941,0.649844,0.830035,0.598943,0.740634,0.710194,0.766767,0.694997,0.521895,0.467084,0.765303,0.603362,0.842879,0.694862,0.629468,0.762154,0.771461,0.805852,0.694997,0.680378,0.715589,0.901024,0.548175,0.642725,0.737051,0.670604,0.680378,0.774566,0.973672,0.758287,0.497455,0.680378,0.73978,0.921906,0.973672,0.961453,0.737051,0.973672,0.973422,0.559491,0.901101,0.973672,0.625015,0.537208,0.66686,0.77571,0.599077,0.805852,0.869082,0.875981,0.961453,0.694862,0.598943,0.887162,0.548175,0.865449,0.617933,0.73943,0.712463,0.790701,0.598943,0.850551,0.901024,0.62236,0.66686,0.668698,0.565938,0.830955,0.819153,0.737051,0.813018,0.657148,0.479277,0.849048,0.83241,0.654807,0.540967,0.827193,0.740634,0.87679,0.737051,0.680378,0.67591,0.733768,0.766612,0.798475,0.63492,0.63492,0.766612,0.562039,0.629468,0.803046,0.518405,0.918903,0.865449,0.67591,0.541208,0.617438,0.648744,0.486164,0.629468,0.106609,0.629468,0.743415,0.598943,0.942418,0.737051,0.872679,0.83229,0.633126,0.66686,0.657148,0.537457,0.629468,0.438227,0.722455,0.531454,0.599159,0.43301,0.732809,0.598943,0.485099,0.657283,0.469829,0.598943,0.619916,0.767994,0.579013,0.704155,0.661082,0.558333,0.727245,0.848874,0.805852,0.925463,0.920974,0.670235,0.914741,0.790701,0.840199,0.540967,0.507149,0.680614,0.827256,0.737051,0.9839,0.980013,0.876695,0.73943,0.912685,0.766612,0.598943,0.694997,0.894312,0.535765,0.892527,0.67591,0.680378,0.82991,0.7004,0.7004,0.681983,0.740634,0.574085,0.433431,0.483064,0.678307,0.767904,0.784211,0.913726,0.504547,0.553811,0.553811,0.598943,0.644157,0.805852,0.723921,0.68724,0.691521,0.571203,0.559491,0.91271,0.81058,0.737051,0.664293,0.876695,0.976971,0.521895,0.464527,0.706613,0.797752,0.521754,0.570582,0.598943,0.923209,0.952254,0.725537,0.781685,0.604909,0.7004,0.628698,0.453324,0.649844,0.759304,0.887162,0.682199,0.654807,0.553811,0.876695,0.864152,0.704155,0.680614,0.639694,0.643708,0.905517,0.541208,0.432911,0.432911,0.774566,0.836479,0.740634,0.740716,0.667036,0.548175,0.978243,0.553811,0.63492,0.886007,0.803046,0.912658,0.737051,0.701057,0.672538,0.774566,0.806037,0.934273,0.649844,0.760219,0.66686,0.643511,0.973451,0.864152,0.912685,0.963238,0.732809,0.968759,0.973672,0.790701,0.82991,0.737051,0.901024,0.680378,0.619916,0.73927,0.712463,0.88088,0.836479,0.559491,0.737051,0.851692,0.851692,0.598943,0.540967,0.521895,0.945113,0.759304,0.531454,0.642725,0.690012,0.805852,0.81058,0.781685,0.741856,0.783783,0.980026,0.694862,0.687632,0.737051,0.737051,0.476879,0.63492,0.809369,0.657753,0.740716,0.564489,0.582829,0.623862,0.804219,0.697462,0.771622,0.619916,0.438227,0.453324,0.504547,0.79622,0.559491,0.465385,0.496301,0.570582,0.7004,0.664293,0.664293,0.680378,0.629468,0.799827,0.551792,0.531454,0.705126,0.894406,0.694997,0.980087,0.886967,0.676367,0.676367,0.603021,0.598943,0.740716,0.664738,0.759304,0.525109,0.565938,0.57682,0.541168,0.562817,0.841293,0.603021,0.864215,0.737051,0.740634,0.737496,0.671869,0.729634,0.901024,0.570582,0.722732,0.722732,0.82991,0.9115,0.848874,0.649844,0.537333,0.661373,0.598943,0.719302,0.766612,0.524487,0.43298,0.518866,0.639348,0.675637,0.768285,0.548175,0.663079,0.553811,0.465854,0.647458,0.435125,0.647458,0.453324,0.523535,0.449329,0.559491,0.521895,0.249209,0.73927,0.790814,0.598943,0.118223,0.601357,0.132861,0.502737,0.649844,0.579013,0.511209,0.649844,0.887162,0.486426,0.705439,0.625185,0.549961,0.945999,0.911652,0.968712,0.912658,0.922238,0.790701,0.961453,0.904775,0.549961,0.858856,0.598943,0.921906,0.629468,0.680378,0.830035,0.719302,0.582313,0.548175,0.541449,0.712463,0.798475,0.719302,0.635151,0.553948,0.644157,0.766767,0.664293,0.57078,0.511209,0.585172,0.67591,0.455491,0.446385,0.441523,0.441523,0.511209,0.723921,0.740634,0.73927,0.841244,0.73927,0.681983,0.740634,0.685108,0.559491,0.598943,0.836826,0.469829,0.446385,0.570582,0.537208,0.598943,0.598943,0.599249,0.537208,0.902497,0.694862,0.739398,0.657283,0.66686,0.887162,0.864152,0.599159,0.62236,0.690839,0.598943,0.657148,0.917613,0.549961,0.762154,0.82991,0.961542,0.864152,0.603362,0.69245,0.528215,0.566486,0.57682,0.824771,0.776801,0.694997,0.600869,0.621556,0.762154,0.665171,0.598943,0.523535,0.554965,0.55686,0.530363,0.549214,0.864152,0.927858,0.814505,0.579013,0.613736,0.553948,0.629468,0.522106,0.511209,0.673896,0.682809,0.929335,0.938116,0.849048,0.640188,0.762251,0.496301,0.535765,0.694862,0.774566,0.680614,0.542841,0.617933,0.933344,0.774566,0.642725,0.559491,0.911797,0.892005,0.903684,0.895514,0.905456,0.94684,0.94891,0.913663,0.882938,0.880155,0.896614,0.89208,0.884011,0.883295,0.886672,0.886349,0.889923,0.88992,0.891233,0.891401,0.892283,0.898481,0.873251,0.891389,0.901837,0.927423,0.893082,0.887459,0.891813,0.916996,0.884512,0.881923,0.901092,0.918671,0.912296,0.866982,0.883026,0.884512,0.888181,0.895519,0.877774,0.885736,0.89135,0.887503,0.906382,0.858807,0.880981,0.911781,0.821883,0.891246,0.883995,0.882386,0.926876,0.905686,0.892092,0.894508,0.915816,0.801011,0.877402,0.89491,0.893535,0.868983,0.89296,0.886037,0.891915,0.879648,0.899929,0.843276,0.906915,0.898526,0.925049,0.864545,0.898581,0.928814,0.90262,0.945415,0.909057,0.932756,0.902806,0.90249,0.888705,0.884559,0.87865,0.886571,0.900519,0.91195,0.892443,0.89454,0.900341,0.916892,0.90481,0.874681,0.900282,0.892571,0.896108,0.847936,0.899058,0.906997,0.915281,0.897397,0.901305,0.899563,0.89175,0.907545,0.908689,0.890286,0.894934,0.90913,0.898995,0.907641,0.938732,0.908161,0.905268,0.940465,0.870574,0.86988,0.884883,0.894605,0.928054,0.928699,0.899068,0.883124,0.876406,0.890179,0.812421,0.843964,0.888515,0.906065,0.915126
13308163,0.767487,0.846338,0.803048,0.540677,0.873561,0.718463,0.648029,0.530707,0.170498,0.251666,0.193458,0.246245,0.282277,0.00465,0.780829,0.713385,0.550719,0.499213,0.779452,0.627275,0.852351,0.713259,0.651807,0.776494,0.785239,0.817557,0.713385,0.699648,0.732736,0.906991,0.575415,0.664265,0.752904,0.683134,0.699648,0.788157,0.97526,0.772859,0.527753,0.699648,0.788699,0.926614,0.97526,0.963777,0.752904,0.97526,0.975024,0.586049,0.907063,0.97526,0.647622,0.56511,0.686945,0.789232,0.623249,0.817557,0.876975,0.883458,0.963777,0.713259,0.623122,0.893965,0.575415,0.873561,0.640968,0.749342,0.729798,0.80332,0.623122,0.859561,0.906991,0.645128,0.686945,0.688672,0.592107,0.841146,0.830056,0.752904,0.824291,0.677818,0.510671,0.858149,0.842513,0.675618,0.568641,0.837611,0.756271,0.884218,0.752904,0.699648,0.695449,0.749819,0.780682,0.810624,0.65693,0.65693,0.780682,0.588443,0.651807,0.81492,0.54744,0.917874,0.873561,0.695449,0.568868,0.640502,0.669921,0.547937,0.651807,0.718463,0.651807,0.758884,0.246245,0.941688,0.752904,0.880355,0.842402,0.655245,0.686945,0.154318,0.565343,0.651807,0.472096,0.739188,0.559702,0.623326,0.467193,0.748917,0.623122,0.516142,0.677945,0.501793,0.623122,0.642831,0.781981,0.604394,0.721991,0.681515,0.584961,0.743689,0.857985,0.817557,0.929957,0.925739,0.690116,0.913659,0.80332,0.764389,0.568641,0.536863,0.699869,0.837671,0.752904,0.984871,0.981218,0.884129,0.644412,0.911577,0.780682,0.623122,0.713385,0.900684,0.563753,0.899007,0.695449,0.699648,0.840165,0.718463,0.718463,0.701156,0.756271,0.599763,0.467589,0.514229,0.697701,0.781896,0.797221,0.918928,0.534417,0.580712,0.580712,0.623122,0.665611,0.817557,0.740566,0.706096,0.710119,0.597054,0.586049,0.917973,0.822,0.752904,0.684532,0.884129,0.978359,0.550719,0.49681,0.724301,0.803048,0.550587,0.596472,0.623122,0.922234,0.955132,0.742084,0.794847,0.628729,0.718463,0.651084,0.486283,0.670955,0.773815,0.893965,0.701359,0.675618,0.580712,0.884129,0.872342,0.721991,0.699869,0.661416,0.665188,0.911213,0.568868,0.4671,0.4671,0.788157,0.846338,0.756271,0.756348,0.68711,0.575415,0.979555,0.580712,0.65693,0.892879,0.81492,0.917923,0.752904,0.71908,0.692281,0.788157,0.817731,0.933439,0.670955,0.774676,0.686945,0.659118,0.975052,0.872342,0.911577,0.965454,0.748917,0.970643,0.97526,0.80332,0.840165,0.752904,0.906991,0.699648,0.642831,0.754989,0.729798,0.888061,0.846338,0.586049,0.752904,0.860633,0.860633,0.623122,0.568641,0.550719,0.948422,0.773815,0.559702,0.664265,0.701804,0.817557,0.822,0.794847,0.757419,0.796818,0.98123,0.713259,0.625599,0.752904,0.752904,0.508417,0.65693,0.820862,0.678387,0.756348,0.590745,0.607979,0.646539,0.816023,0.715702,0.785391,0.642831,0.472096,0.486283,0.534417,0.801556,0.586049,0.497616,0.526668,0.596472,0.718463,0.684532,0.684532,0.699648,0.651807,0.811895,0.578814,0.559702,0.722903,0.900772,0.713385,0.981287,0.885534,0.695879,0.695879,0.626954,0.623122,0.756348,0.68495,0.773815,0.55374,0.592107,0.602333,0.56883,0.589175,0.850861,0.626954,0.872401,0.752904,0.756271,0.753322,0.687345,0.745934,0.906991,0.596472,0.739449,0.739449,0.840165,0.916835,0.857985,0.670955,0.565226,0.681789,0.623122,0.736225,0.780682,0.553155,0.467165,0.547873,0.661091,0.565942,0.782255,0.575415,0.683392,0.580712,0.498058,0.668712,0.46918,0.668712,0.486283,0.55226,0.482528,0.586049,0.550719,0.491545,0.754989,0.803425,0.623122,0.754989,0.62539,0.788157,0.532716,0.670955,0.604394,0.540677,0.670955,0.893965,0.517389,0.723198,0.647783,0.577094,0.945313,0.910532,0.970598,0.917923,0.926926,0.80332,0.963777,0.903567,0.577094,0.867365,0.623122,0.926614,0.651807,0.699648,0.840282,0.736225,0.607495,0.575415,0.569095,0.729798,0.810624,0.736225,0.657147,0.58084,0.665611,0.780829,0.684532,0.596657,0.540677,0.604737,0.695449,0.488319,0.479762,0.475193,0.475193,0.540677,0.740566,0.756271,0.754989,0.850815,0.754989,0.701156,0.756271,0.704092,0.586049,0.623122,0.846663,0.501793,0.479762,0.596472,0.56511,0.623122,0.623122,0.62341,0.56511,0.908375,0.713259,0.755109,0.677945,0.686945,0.893965,0.872342,0.623326,0.645128,0.709478,0.623122,0.677818,0.916567,0.577094,0.776494,0.840165,0.96386,0.872342,0.627275,0.750266,0.556658,0.592622,0.602333,0.835336,0.790257,0.713385,0.624932,0.644372,0.776494,0.685358,0.623122,0.55226,0.581796,0.583576,0.558677,0.576392,0.872342,0.926943,0.825688,0.604394,0.637023,0.58084,0.651807,0.550918,0.540677,0.693556,0.701932,0.281561,0.62493,0.858149,0.66188,0.776585,0.526668,0.563753,0.713259,0.788157,0.699869,0.570403,0.640968,0.932499,0.788157,0.664265,0.586049,0.910678,0.890635,0.902462,0.894189,0.904257,0.946166,0.948261,0.912568,0.885067,0.865796,0.895302,0.890711,0.882539,0.881815,0.886081,0.884907,0.873987,0.891922,0.875487,0.890024,0.890916,0.897194,0.887462,0.890011,0.908585,0.926502,0.880271,0.873975,0.876151,0.915943,0.883047,0.880425,0.899838,0.917639,0.936047,0.881896,0.89614,0.883047,0.900717,0.883034,0.876224,0.884287,0.889971,0.886076,0.895165,0.873834,0.879471,0.907131,0.881038,0.878216,0.882524,0.880894,0.925948,0.904489,0.89951,0.90176,0.914748,0.933222,0.865434,0.893577,0.866717,0.883672,0.887317,0.872382,0.890544,0.887922,0.89866,0.873802,0.86885,0.912535,0.835776,0.899768,0.898918,0.899703,0.898306,0.856044,0.928112,0.931903,0.901573,0.890807,0.887293,0.883094,0.877111,0.872981,0.911672,0.910833,0.914979,0.906363,0.899077,0.915838,0.903603,0.900939,0.888334,0.915081,0.89479,0.849482,0.897778,0.88357,0.903016,0.896096,0.91493,0.887529,0.890376,0.906372,0.907531,0.888894,0.893601,0.907978,0.897713,0.906469,0.937954,0.897157,0.904067,0.939709,0.879471,0.868229,0.883423,0.893268,0.927142,0.963605,0.884456,0.879645,0.874838,0.888785,0.844376,0.888853,0.888103,0.89481,0.813154


In [15]:
data_matrix = np.array(data_matrix)

gb_raw_shape = data_matrix.shape
print(gb_raw_shape)

gb_data = []
for i in range(gb_raw_shape[1]):
    gb_data.extend(data_matrix[:, i, :])
gb_data = np.array(gb_data)
print(gb_data.shape)

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

# get the projects for lowest predictions for each publication with distance matrix
for num_top in range(10, 0, -1):
    project_numbers_pred = []
    for i in range(len(train_pub_data), distance_matrix.shape[1]):
        project_numbers_pred.append(list(np.argsort(distance_matrix[:, i] + 1))[:num_top])

    project_lists = []
    for i in range(0, gb_data.shape[0], gb_raw_shape[0]):
        pub_belongs = gb_data[i:i + gb_raw_shape[0], 0] * project_numbers[i:i + gb_raw_shape[0]]
        project = sorted(list(pub_belongs[pub_belongs != 0].astype(int)), reverse=True)
        project_lists.append(project)

    project_lists_test = project_lists[len(train_pub_data):]

    # calculate accuracy
    # use y_test as mask for project_numbers_test
    accuracy_list = []
    for i, project_list in enumerate(list(project_lists_test)):
        ratio = len(set(project_numbers_pred[i]) & set(project_list)) / len(set(project_list))
        accuracy_list.append(ratio)

    accuracy = sum(accuracy_list) / len(accuracy_list)
    print(accuracy)

(225, 635, 2)
(142875, 2)
0.16279069767441862
0.13178294573643412
0.10077519379844961
0.10077519379844961
0.07751937984496124
0.06976744186046512
0.06976744186046512
0.046511627906976744
0.031007751937984496
0.031007751937984496
