In [1]:
from bertopic import BERTopic
from sklearn.metrics.pairwise import cosine_similarity
from scipy.spatial.distance import jensenshannon
import pandas as pd
import numpy as np
import json



  from .autonotebook import tqdm as notebook_tqdm


In [2]:
with open('dim_sample.json') as f:
    all_data = json.load(f)

def get_unique_dis(data):
    disciplines = set()
    for pro_id in data.keys():
        disciplines.update(data[pro_id]['disciplines'])
    return disciplines

In [3]:
split = 180
train_data = {k: all_data[k] for k in list(all_data.keys())[:split]}
test_data = {k: all_data[k] for k in list(all_data.keys())[split:]}

train_project_data = {}
train_pub_data = []
for pro_id in train_data.keys():
    train_project_data[pro_id] = (train_data[pro_id]['abstract'], train_data[pro_id]['disciplines'])
    for pub_id in train_data[pro_id]['publications'].keys():
        train_pub_data.append((pub_id, train_data[pro_id]['publications'][pub_id]['abstract'], train_data[pro_id]['publications'][pub_id]['disciplines']))

test_project_data = {}
test_pub_data = []
for pro_id in test_data.keys():
    test_project_data[pro_id] = (test_data[pro_id]['abstract'], test_data[pro_id]['disciplines'])
    for pub_id in test_data[pro_id]['publications'].keys():
        test_pub_data.append((pub_id, test_data[pro_id]['publications'][pub_id]['abstract'], test_data[pro_id]['publications'][pub_id]['disciplines']))

print(len(train_project_data), len(train_pub_data))
print(len(test_project_data), len(test_pub_data))
print(len(get_unique_dis(train_data)), len(get_unique_dis({pub[0]: {'disciplines': pub[2]} for pub in train_pub_data})))

180 506
45 129
170 170


In [4]:
train_docs = [project[0] for project in train_project_data.values()] + [pub[1] for pub in train_pub_data]
test_docs = [project[0] for project in test_project_data.values()] + [pub[1] for pub in test_pub_data]

In [5]:
topic_model = BERTopic(language="english", calculate_probabilities=True, verbose=True)
topics, probs = topic_model.fit_transform(train_docs)

2024-06-16 19:28:33,619 - BERTopic - Embedding - Transforming documents to embeddings.
Batches: 100%|██████████| 22/22 [00:08<00:00,  2.51it/s]
2024-06-16 19:28:44,660 - BERTopic - Embedding - Completed ✓
2024-06-16 19:28:44,661 - BERTopic - Dimensionality - Fitting the dimensionality reduction algorithm




2024-06-16 19:28:50,487 - BERTopic - Dimensionality - Completed ✓
2024-06-16 19:28:50,488 - BERTopic - Cluster - Start clustering the reduced embeddings
2024-06-16 19:28:50,536 - BERTopic - Cluster - Completed ✓
2024-06-16 19:28:50,539 - BERTopic - Representation - Extracting topics from clusters using representation models.
2024-06-16 19:28:50,682 - BERTopic - Representation - Completed ✓


In [7]:
project_abstracts = [project[0] for project in train_project_data.values()] + [project[0] for project in test_project_data.values()]
pub_abstracts = [pub[1] for pub in train_pub_data] + [pub[1] for pub in test_pub_data]

project_matrix = topic_model.approximate_distribution(project_abstracts)[0]

pub_matrix = topic_model.approximate_distribution(pub_abstracts)[0]

100%|██████████| 1/1 [00:00<00:00,  3.22it/s]
100%|██████████| 1/1 [00:00<00:00,  1.34it/s]


In [8]:
distance_matrix = np.zeros((len(project_matrix), len(pub_matrix)))

for i in range(len(project_matrix)):
    for j in range(len(pub_matrix)):
        distance_matrix[i, j] = 1 - cosine_similarity([project_matrix[i]], [pub_matrix[j]])[0][0]

distance_matrix.shape

(225, 635)

In [12]:
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
# create a dataframe with row indices as project ids and column indices as publication ids
# if publication is in project, then 1, else 0
# if publication date is before project start date, then 0, else 1
# ratio of intersection of organisations from project and publication to organisations from publication
# ratio of intersection of authors from project and publication to authors from publication

all_data = {**train_data, **test_data}
pub_data = []
for pro_id in all_data.keys():
    for pub_id in all_data[pro_id]['publications'].keys():
        pub_data.append((pub_id, all_data[pro_id]['publications'][pub_id]))

data_matrix = [[0.] * len(pub_data) for _ in range(len(all_data))]
for i, pro_id in enumerate(all_data.keys()):
    for j, pub_id in enumerate([pub[0] for pub in pub_data]):
        belongs = 1 if pub_id in all_data[pro_id]['publications'].keys() else 0
        distance = distance_matrix[i, j]
        data_matrix[i][j] = [belongs, distance]

df = pd.DataFrame(distance_matrix, index=all_data.keys(), columns=[pub[0] for pub in pub_data])
df.to_csv('distance_bert_dim_abstract.csv')
df.head()

Unnamed: 0,10.3389/fmars.2023.1254461,10.1007/978-3-031-49133-7_8,10.1007/978-3-031-43619-2_15,10.1080/11663081.2023.2246863,10.1177/03057356231165327,10.1016/j.jconrel.2024.05.037,10.1007/s13346-024-01618-6,10.1002/smll.202303682,10.1371/journal.pone.0298895,10.1007/s00334-024-00992-y,10.1038/s41598-023-44445-4,10.1101/2023.09.15.557939,10.1016/j.jasrep.2023.104204,10.1016/j.palaeo.2023.111655,10.1007/jhep05(2024)154,10.1140/epjc/s10052-024-12711-y,10.1140/epjc/s10052-024-12416-2,10.1140/epjc/s10052-024-12415-3,10.1007/jhep02(2024)124,10.1007/jhep11(2023)103,10.1007/jhep06(2023)086,10.1093/iob/obad026,10.1007/s00359-023-01629-7,10.1101/2023.03.11.531676,10.1093/mnras/stae997,10.1093/mnras/stae616,10.1051/0004-6361/202348958,10.1093/mnras/stad3163,10.1093/mnras/stad2183,10.1101/2024.01.14.574481,10.1007/s40313-024-01095-9,10.1109/tpwrs.2023.3321700,10.1109/tits.2024.3392914,10.1007/978-981-97-0989-2_24,10.1109/tsc.2023.3332701,10.1007/978-3-031-48424-7_15,10.1007/978-3-031-48424-7_13,10.1145/3631353,10.1145/3629517,10.1109/icdcs57875.2023.00111,10.1109/icws60048.2023.00056,10.1109/icws60048.2023.00031,10.1109/icws60048.2023.00068,10.1109/tsc.2023.3307143,10.1145/3600232,10.1109/mic.2023.3267266,10.1109/tsc.2023.3241975,10.1109/tmc.2022.3230856,10.1007/978-3-031-20984-0_9,10.1109/tsc.2022.3160469,10.3389/fneur.2023.1182561,10.1038/s41598-024-57498-w,10.1016/j.jmrt.2023.11.014,10.1016/j.jmst.2023.05.020,10.1016/j.fuel.2023.130187,10.1017/9781009297349,10.1007/s11229-023-04282-4,10.3390/rel14060758,10.1002/smsc.202400096,10.1016/j.actpsy.2024.104252,10.1080/02691728.2024.2326828,10.5964/ejop.12031,10.1111/jopy.12805,10.1109/lsp.2023.3277792,10.21203/rs.3.rs-3644422/v1,10.1016/j.renene.2024.120101,10.1093/rheumatology/kead301,10.1097/mlr.0000000000002000,10.1111/tmi.13827,10.1063/5.0167167,10.1021/acsami.2c19376,10.1021/acsanm.2c05047,10.1101/2024.05.21.595254,10.1038/s41467-024-47964-4,10.1093/jb/mvae021,10.1016/j.neuron.2024.01.014,10.1016/j.isci.2023.107385,10.1016/j.peptides.2023.171051,10.3389/fphar.2023.1138666,10.3389/fphar.2023.1098976,10.1186/s43058-023-00521-4,10.1177/26334895231199467,10.1002/adom.202303199,10.1002/adom.202301232,10.1016/j.energy.2024.130322,10.1126/sciimmunol.abo4365,10.1515/sem-2023-0178,10.1364/boe.506664,10.1364/boe.494585,10.3847/1538-4357/ac4601,10.1371/journal.pone.0284416,10.1080/07350015.2023.2271039,10.1093/mnras/stae385,10.1093/mnras/stad2760,10.1002/ange.202320045,10.1002/anie.202320045,10.1016/j.chembiol.2024.02.012,10.1101/2023.11.29.569293,10.1038/s41467-023-41197-7,10.35772/ghm.2023.01065,10.3390/v15040896,10.1111/dar.13836,10.1063/5.0153862,10.1109/imoc57131.2023.10379741,10.1109/imoc57131.2023.10379729,10.1109/access.2023.3339563,10.1109/ojpel.2023.3339014,10.1109/csci58124.2022.00203,10.1016/j.ssci.2022.105967,10.1007/978-3-031-06015-1_8,10.1101/2023.01.19.524726,10.1007/s00382-023-07058-1,10.1002/oa.3284,10.1136/bmjopen-2023-080603,10.1101/2023.08.02.551649,10.1099/mgen.0.000965,10.2140/ant.2022.16.2005,10.1103/physrevlett.132.103402,10.21468/scipostphys.15.2.068,10.1080/02606755.2023.2213550,10.3390/rs15204928,10.1063/5.0203603,10.1103/physrevapplied.21.054027,10.1109/icecom58258.2023.10367924,10.1109/icecom58258.2023.10367934,10.1109/icecom58258.2023.10367938,10.1109/icecom58258.2023.10367923,10.1109/metamaterials58257.2023.10289546,10.23919/ursigass57860.2023.10265525,10.1109/elmar59410.2023.10253914,10.1002/pen.26771,10.1016/j.canep.2023.102451,10.3390/biomedicines11051344,10.3390/pharmaceutics15010181,10.1037/fam0001189,10.3390/su15129371,10.1038/s44221-024-00208-7,10.1093/evolut/qpae036,10.1093/evolut/qpae024,10.3390/micro4010008,10.3390/molecules28196822,10.1007/s11673-023-10285-0,10.1021/acsnano.3c09776,10.1101/2023.09.08.556607,10.1016/j.snb.2023.133733,10.1016/j.ocecoaman.2023.106961,10.1016/j.tre.2023.103169,10.1016/j.elerap.2023.101336,10.1590/0001-3765202320230351,10.1590/s1678-3921.pab2023.v58.03246,10.1038/s41598-024-56540-1,10.1364/ol.494369,10.1017/s0963180124000112,10.1136/jme-2023-109568,10.1111/japp.12655,10.1038/s41539-023-00170-1,10.1016/j.neubiorev.2023.105153,10.1007/s00158-023-03663-0,10.3390/ma16145076,10.1007/978-3-031-55260-1_15,10.1007/s11228-024-00719-1,10.1007/s00205-023-01948-8,10.1142/s0219199723500657,10.1007/s12220-023-01484-7,10.1007/s10957-023-02344-8,10.1007/978-3-031-46359-4_2,10.1007/s10208-023-09629-4,10.1007/s00245-023-10029-x,10.1007/s00028-023-00902-1,10.1016/j.jde.2023.06.004,10.1007/s00030-023-00857-9,10.1007/s11579-023-00333-z,10.1061/jmenea.meeng-5794,10.1177/21695067231194338,10.1038/s41597-024-03034-4,10.1039/d3ew00347g,10.1101/2024.05.17.24307550,10.1101/2024.01.09.24301073,10.1038/s41598-023-41853-4,10.1111/sjos.12685,10.1038/s41593-023-01321-8,10.1016/j.jclinepi.2023.02.020,10.1371/journal.pone.0280192,10.1016/j.jbi.2022.104243,10.1016/j.eclinm.2022.101724,10.38107/037,10.1002/adfm.202314696,10.1063/5.0168129,10.1103/physrevmaterials.7.064202,10.1038/s41699-023-00404-1,10.1061/jsendh.steng-12655,10.1186/s40623-023-01940-2,10.1029/2022ja031231,10.1029/2023ja031663,10.1029/2022gl101465,10.21203/rs.3.rs-4345687/v1,10.1093/toxsci/kfae021,10.1101/2023.08.28.555101,10.1103/physrevb.109.205125,10.1111/cgf.14942,10.1109/tpami.2022.3163720,10.1016/j.csl.2024.101623,10.1039/d0sc01737j,10.1186/s12889-023-17570-y,10.1080/13218719.2023.2243303,10.5694/mja2.52089,10.1177/00938548231170799,10.1007/s11150-024-09710-z,10.1016/j.jbankfin.2023.107047,10.1016/j.euroecorev.2023.104632,10.1038/s41598-023-30724-7,10.1038/s41598-023-29536-6,10.1111/obes.12545,10.1016/j.jebo.2022.11.027,10.3389/fimmu.2023.1060258,10.1016/j.jhydrol.2024.130983,10.1101/2024.03.18.585583,10.1016/j.celrep.2024.113675,10.1103/physrevx.14.021017,10.1038/s41559-024-02331-w,10.1016/j.gloplacha.2024.104354,10.1038/s41467-023-41685-w,10.1126/sciadv.adg7679,10.1144/sp532-2022-1,10.1523/jneurosci.0226-23.2023,10.1101/2023.01.11.523491,10.1073/pnas.2309379120,10.1073/pnas.2301947120,10.1038/s41467-024-48673-8,10.1038/s41467-024-47953-7,10.1016/j.fsigen.2024.103048,10.1093/bib/bbad163,10.1101/2023.12.12.570420,10.1016/j.celrep.2023.113331,10.1103/physrevd.108.105013,10.1007/jhep11(2023)005,10.1101/2024.01.29.574039,10.1126/scitranslmed.adi9711,10.3390/cancers15143723,10.1021/acsnano.3c11337,10.1038/s41467-023-36133-8,10.1016/j.cobme.2024.100547,10.1002/ange.202319567,10.1002/anie.202319567,10.1016/j.jfca.2023.105901,10.1016/j.foodcont.2023.109969,10.1016/j.respol.2024.104954,10.1371/journal.pbio.3002513,10.1109/qce57702.2023.00111,10.1109/iccad57390.2023.10323863,10.1016/j.ic.2023.105077,10.1145/3582016.3582039,10.1109/tcad.2022.3179223,10.1145/3517145,10.1016/j.tcs.2022.02.017,10.1145/3514355,10.1145/3514239,10.1038/s41598-024-51799-w,10.3390/cells12242815,10.5771/9783748935544,10.1016/j.eswa.2024.124100,10.1016/j.frl.2024.105308,10.12688/openreseurope.16436.1,10.12688/openreseurope.16278.1,10.12688/openreseurope.15386.1,10.3390/foods12244484,10.1057/s42984-024-00090-3,10.1002/anie.202315985,10.1002/ange.202315985,10.1161/atvbaha.123.319821,10.1093/cvr/cvad149,10.1161/strokeaha.123.042714,10.1016/j.jtha.2023.04.002,10.1182/bloodadvances.2023010100,10.3389/fphar.2024.1379236,10.1101/2023.07.03.547532,10.1103/physreve.107.l052602,10.1063/5.0133871,10.1109/icnwc57852.2023.10127328,10.1016/j.atech.2023.100265,10.1016/j.cct.2023.107387,10.1155/2023/2397564,10.1007/s10502-024-09441-1,10.1111/gcb.16637,10.3390/ma16051978,10.21203/rs.3.rs-4271873/v1,10.1038/s41419-024-06693-8,10.1038/s41598-024-56928-z,10.1016/j.chemgeo.2024.122157,10.1016/j.chemgeo.2022.121064,10.2343/geochemj.gj22004,10.1016/j.jwpe.2023.104395,10.1016/j.jece.2023.111107,10.1080/02614367.2022.2162109,10.1109/twc.2024.3400601,10.1109/globecom54140.2023.10437972,10.1109/twc.2023.3344802,10.1109/tifs.2023.3268443,10.1093/ptep/ptae021,10.1021/accountsmr.4c00071,10.26434/chemrxiv-2024-hvxml,10.1039/d4nr01024h,10.1038/s42004-024-01143-0,10.1039/d3dd00236e,10.1039/d3tc03606e,10.1021/acs.chemmater.3c01744,10.1021/acs.inorgchem.3c02337,10.1063/5.0144827,10.1002/anie.202314378,10.1002/ange.202314378,10.1039/d3ta04707e,10.1039/d3ce00881a,10.1002/asia.202300673,10.1038/s41467-023-38737-6,10.26434/chemrxiv-2023-d1s8w,10.1002/adma.202211478,10.1145/3589334.3645329,10.1029/2023gl104396,10.20396/cel.v65i00.8673331,10.1016/j.procs.2023.08.230,10.1371/journal.pbio.3001984,10.1101/2022.04.22.489138,10.1002/brb3.3490,10.1016/j.clinph.2024.04.002,10.1111/ejn.16001,10.3389/fneur.2023.1177589,10.1016/j.clinph.2022.08.015,10.1101/2024.05.23.24307833,10.1093/ofid/ofad655,10.1093/ofid/ofae018,10.1371/journal.pone.0297775,10.21203/rs.3.rs-2640564/v3,10.1002/saj2.20688,10.1071/sr23164,10.1029/2023gl104852,10.1038/s41598-022-10957-8,10.1186/s40623-022-01584-8,10.1111/nph.19336,10.3389/fpsyg.2022.1014713,10.3390/v15102029,10.3389/fnut.2023.1215768,10.3390/educsci13080838,10.12688/routledgeopenres.17798.2,10.12688/routledgeopenres.17798.1,10.1080/00031305.2023.2232006,10.1080/0969725x.2023.2270357,10.1177/00345237231183343,10.1016/j.ijheatmasstransfer.2023.124665,10.1039/d3qm01106b,10.1016/j.mechmachtheory.2023.105508,10.1016/j.scib.2024.02.010,10.1088/1674-4527/ace179,10.1126/science.abl7759,10.1016/j.scitotenv.2024.172840,10.1016/j.envint.2024.108601,10.1016/j.envint.2024.108454,10.1016/j.envint.2023.108375,10.1016/j.envres.2023.117611,10.1016/j.envres.2023.117832,10.2337/dc23-0327,10.1021/acs.est.3c02765,10.1021/acs.est.3c00848,10.1007/s40726-023-00269-4,10.1021/acs.analchem.3c00376,10.1289/ehp11372,10.1101/2023.02.09.527886,10.3390/make6020035,10.1016/j.micromeso.2024.113042,10.3390/make6010014,10.1016/j.compag.2024.108650,10.1038/s41598-023-34320-7,10.1016/j.compag.2022.107325,10.1145/3615894.3628507,10.1016/j.scs.2023.104435,10.1093/jipm/pmac028,10.1145/3651171,10.1016/j.clsr.2024.105934,10.1145/3594739.3605113,10.1093/lambio/ovae041,10.1007/s12155-024-10734-7,10.1016/j.carres.2024.109068,10.1007/s00253-023-12908-3,10.1007/s00289-024-05152-w,10.3390/polysaccharides4020013,10.3389/fagro.2023.1148969,10.1038/s41586-024-07473-2,10.1101/2023.11.30.569198,10.1186/s13015-024-00254-6,10.1007/978-1-0716-3989-4_3,10.4230/lipics.wabi.2023.17,10.1186/s13015-024-00261-7,10.1101/2023.11.22.568259,10.1093/gbe/evad205,10.1101/gr.277679.123,10.1101/2023.06.21.545862,10.1145/3571723,10.1101/2023.05.12.540616,10.1101/2023.03.02.530874,10.1101/2023.01.30.526175,10.1101/2022.12.23.521809,10.1038/s41390-023-02992-6,10.1001/jama.2023.20358,10.1542/hpeds.2023-007246,10.1016/j.jpeds.2023.113499,10.1093/jamia/ocad053,10.1093/jamia/ocac251,10.1038/s41598-024-54655-z,10.1172/jci175031,10.3389/fgene.2023.1304425,10.1186/s13578-023-01102-7,10.1016/j.gendis.2022.11.003,10.1002/mp.16880,10.1002/mp.16352,10.1016/j.scitotenv.2022.158267,10.1016/j.foreco.2022.120301,10.1016/j.ecolind.2022.109004,10.1073/pnas.2318333121,10.1063/5.0158930,10.1145/3588432.3591521,10.1063/5.0142166,10.1038/s41467-024-46494-3,10.1128/mbio.02479-23,10.1101/2023.09.08.556855,10.1101/2023.08.31.555785,10.1186/s40168-022-01378-w,10.1101/2023.12.18.572279,10.1093/nar/gkad1164,10.1101/2023.12.03.569795,10.1101/2023.07.26.550759,10.1186/s12864-023-09265-w,10.1021/acsanm.3c05701,10.1016/j.apsusc.2023.158316,10.1080/03057240.2024.2333577,10.3390/rel14121517,10.3390/rel14111427,10.1109/icops45740.2023.10480948,10.1109/icops45740.2023.10481052,10.1109/icops45740.2023.10481130,10.1038/s41598-024-51298-y,10.1109/ppc47928.2023.10311041,10.1109/ppc47928.2023.10310918,10.1049/hve2.12382,10.21203/rs.3.rs-3143506/v1,10.4271/03-16-08-0061,10.1080/02560046.2024.2316302,10.1177/01634437231219141,10.1177/16094069231182015,10.1177/00113921231182182,10.1002/cjce.25286,10.1080/07373937.2024.2318437,10.1016/j.etap.2024.104382,10.1080/19440049.2023.2283769,10.3390/ani13152499,10.1016/j.jet.2024.105798,10.1038/s41467-023-41107-x,10.1016/j.oneear.2023.05.006,10.1088/1748-9326/acd5e8,10.1088/1748-9326/aca815,10.1145/3617232.3624856,10.1109/cloudcom59040.2023.00047,10.1007/s11761-024-00391-1,10.1109/percomworkshops56833.2023.10150370,10.1016/j.comcom.2023.04.027,10.1109/apsec57359.2022.00034,10.1109/cloudcom55334.2022.00016,10.1371/journal.pone.0285434,10.1186/s13578-023-01012-8,10.1161/strokeaha.122.041651,10.1080/15534510.2023.2279662,10.1111/nana.12994,10.1080/14680777.2023.2258298,10.1038/s41598-023-35252-y,10.1177/10596011231193176,10.1016/j.jhin.2023.03.002,10.1177/10596011221150756,10.1080/08039488.2024.2322495,10.1007/s00787-024-02406-w,10.1142/s0219877024500275,10.1155/2023/2516746,10.1080/08039488.2023.2222698,10.3389/fpsyg.2023.1183704,10.1111/acer.15119,10.1080/20008066.2023.2191396,10.1007/s00787-022-02107-2,10.1007/s11218-022-09734-2,10.1016/j.rssm.2023.100876,10.3390/f15020354,10.1007/s11629-023-8914-3,10.14746/quageo-2023-0016,10.18146/view.297,10.18146/tmg.835,10.5117/9789463727815,10.1177/08912424231163485,10.1007/978-94-6265-515-7,10.1038/s41467-023-41057-4,10.1093/gigascience/giad047,10.1038/s41592-023-01886-z,10.1093/nar/gkad289,10.1101/2023.01.21.525030,10.1016/j.gpb.2022.09.011,10.1021/acs.jpcb.4c01987,10.1021/acs.jctc.3c00663,10.1021/acs.jpcb.3c04473,10.26434/chemrxiv-2023-w0h1p,10.1073/pnas.2305899120,10.1101/2023.05.01.538927,10.1101/2023.12.22.23300430,10.1002/agt2.386,10.1002/adfm.202214179,10.1109/milcom58377.2023.10356332,10.1101/2024.05.03.24306699,10.1101/2024.04.16.24305925,10.1101/2023.10.25.23297571,10.3389/fphys.2023.1202186,10.1103/physrevb.109.205301,10.1103/physrevb.108.195303,10.1523/eneuro.0197-23.2023,10.3390/v15091897,10.1016/j.prdoa.2024.100251,10.3390/ijms24108995,10.3390/ijms24032247,10.1016/j.isci.2023.108171,10.1158/2326-6066.cir-23-0496,10.1101/2023.12.07.570715,10.1016/j.cell.2023.11.008,10.1093/abt/tbad025,10.1016/j.celrep.2023.113280,10.1101/2023.06.18.545488,10.3390/cancers15102788,10.1101/2023.03.07.531525,10.1080/13543784.2023.2179482,10.1016/j.bbrc.2022.09.019,10.3389/fimmu.2022.996026,10.1111/liv.15927,10.1101/2023.11.17.23298672,10.1111/liv.15665,10.1016/j.cgh.2023.04.016,10.1016/j.jhepr.2022.100667,10.1007/s11914-023-00843-1,10.1007/s11914-023-00842-2,10.1007/s11914-023-00855-x,10.3390/rs15235545,10.1029/2022gl102689,10.3390/rs14236069,10.1038/s41467-024-46327-3,10.1002/cam4.6761,10.3389/fonc.2023.1100585,10.1109/vtc2023-fall60731.2023.10333522,10.1128/jvi.00100-23,10.1021/acs.jpcc.3c05477,10.1021/acsaem.3c01370,10.3389/fnins.2023.1217993,10.1016/j.visres.2023.108296,10.1016/j.jad.2023.07.014,10.1001/jamanetworkopen.2023.17905,10.1007/s00371-024-03454-8,10.1109/smc53992.2023.10394105,10.1007/s00521-023-09367-2,10.1145/3582700.3582707,10.1007/s10803-024-06302-9,10.1016/j.psychres.2024.115838,10.1016/j.rasd.2024.102339,10.1177/13623613231213543,10.1007/s10803-023-06039-x,10.1016/j.jplph.2023.154138,10.1016/j.freeradbiomed.2024.04.217,10.1016/j.freeradbiomed.2023.06.021,10.1093/jncimonographs/lgad014,10.1038/s41467-023-37269-3,10.1111/liv.15893,10.1101/2023.04.25.538102,10.1063/5.0142200,10.1016/b978-0-323-95124-1.00017-6,10.1101/2023.05.17.541187,10.1101/2023.05.17.541174,10.1007/s00415-024-12430-0,10.1093/ntr/ntae084,10.1093/schbul/sbae024,10.1038/s41386-024-01842-1,10.21203/rs.3.rs-3168186/v1,10.1101/2023.08.21.23294348,10.1038/s41380-023-02165-1,10.1136/bmjopen-2022-066249,10.1038/s41585-024-00869-9,10.1158/0008-5472.can-23-0555,10.1101/2022.11.02.514910,10.3390/s24072335,10.1109/sensors56945.2023.10324963,10.1038/s41528-023-00258-z,10.3390/bios12050322,10.1371/journal.pone.0288803,10.3389/fpubh.2023.1219676,10.1016/j.soard.2023.09.026,10.3389/fpsyg.2023.1106571,10.2196/46415,10.1101/2023.04.20.23288698,10.1111/joes.12620,10.1101/2024.04.22.24306094,10.1007/s00401-024-02721-1,10.1101/2024.02.28.582621,10.1016/j.neuron.2024.01.008,10.1002/alz.13576,10.1001/jamaneurol.2023.3599,10.1186/s40478-023-01626-6,10.1111/acel.13938,10.1101/2023.07.20.23292771,10.1101/2023.07.06.23292312,10.1101/2023.04.21.23288938,10.1186/s13024-022-00590-4,10.1186/s13058-024-01777-x,10.1117/1.jmi.10.5.054503,10.1002/mp.17040,10.1016/j.brat.2024.104494,10.1176/appi.ajp.20230272,10.1001/jamapsychiatry.2023.5138,10.1016/j.addbeh.2023.107911,10.1016/j.explore.2023.11.001,10.1038/s44220-023-00084-2,10.1007/s40429-023-00501-7,10.1016/j.drugalcdep.2023.109890,10.1145/3631461.3631550,10.1016/j.jcss.2023.02.004,10.1080/15384101.2021.2023304,10.3390/ijms241713272,10.1016/j.jval.2024.01.020,10.1038/s41366-023-01396-0,10.1021/acs.jpcc.3c04680,10.1021/acs.jpcc.4c01814,10.4025/actascilangcult.v45i2.67723,10.1007/s10915-023-02353-9,10.1007/s42967-023-00287-5,10.1007/s10543-023-00954-2,10.1128/jvi.00398-22,10.1093/genetics/iyad216,10.1101/2023.10.17.562696
9852805,0.262666,0.441082,0.820559,0.478849,0.504097,0.722874,0.713764,0.419868,0.080667,0.654289,0.153135,0.701182,0.452925,0.07361,0.61437,0.649757,0.537657,0.577775,0.782387,0.776079,0.641858,0.76721,0.605969,0.770769,0.702675,0.87734,0.89131,0.916502,0.989383,0.754168,0.643046,0.6053,0.789495,0.709521,0.710967,0.714062,0.776797,0.715671,0.675283,0.650886,0.811237,0.831983,0.787048,0.824379,0.850339,0.838164,0.815392,0.778223,0.607815,0.827489,0.575307,0.504337,0.475772,0.355766,0.467155,0.73907,0.508183,0.650884,0.787172,0.767981,0.818886,0.43345,0.561021,0.612363,0.620162,0.647592,0.66276,0.965715,0.64127,0.67854,0.720668,0.549566,0.541473,0.550933,0.697586,0.887377,0.944899,0.496868,0.927216,0.773003,0.956205,0.880002,0.684102,0.69848,0.496962,0.893078,0.673056,0.700267,0.767099,0.877555,0.286607,0.553311,0.944757,0.985237,0.512319,0.512319,0.811386,0.635433,0.841817,0.672381,1.0,0.77946,0.894043,0.503658,0.738118,0.39565,0.665235,0.629105,0.836386,0.800656,0.821211,0.087,0.519984,0.766727,0.524362,0.553661,0.561086,0.946476,1.0,0.447283,0.368606,0.783258,0.618944,0.741847,0.658816,0.722477,0.812531,0.699587,0.785305,0.782799,0.518565,0.642814,0.733077,0.793753,0.825683,0.186724,0.273326,0.847439,0.920057,0.764836,0.547942,0.675172,0.964621,0.96139,0.991986,0.675149,0.727125,1.0,0.566531,0.70021,0.625355,0.742308,0.620244,0.718928,0.786491,0.677448,0.773813,0.671237,0.662895,0.763573,0.913159,0.771645,0.901144,0.925688,0.725895,0.833413,0.90628,0.887434,0.810448,0.782528,0.945104,0.911476,0.700674,0.600647,0.64737,0.391865,0.644353,0.897734,0.627559,0.848961,1.0,0.438401,0.715135,0.830768,0.992972,0.525904,0.835105,0.535832,0.806124,0.622946,0.637905,0.471817,0.559437,0.477169,0.419752,0.94666,0.586738,0.93009,0.773499,0.675206,0.638229,0.547015,0.818076,0.956156,0.640677,0.688073,1.0,0.786634,1.0,0.445127,0.657075,0.897527,0.809107,0.669831,1.0,0.494179,0.722855,0.956183,0.701397,0.213474,0.083447,0.057637,0.090776,0.031756,0.978595,0.975717,0.489941,0.531583,0.737324,0.79549,0.901069,0.680314,0.752433,0.911395,0.82837,0.666133,0.728757,0.961532,0.544031,0.666717,0.614845,0.623033,0.872903,0.869249,0.731856,0.80126,0.367804,0.535881,0.932832,0.927128,0.967253,0.985215,0.980703,0.965701,0.972926,0.961011,0.897826,0.928639,0.692219,0.661187,0.882746,1.0,0.819608,0.67349,0.774812,0.624885,0.669712,0.756803,0.756803,0.679822,0.821479,0.902887,0.951517,0.963622,0.574681,0.773595,0.771615,0.35916,0.664564,0.618446,0.847109,0.692717,0.653164,0.102521,0.785211,0.7539,0.799474,0.911258,0.309901,0.326208,0.484199,0.587577,0.568052,0.814261,0.447955,0.677839,0.696504,0.557389,0.473626,0.832236,0.831137,0.916011,1.0,0.756124,0.8985,0.961146,0.892735,0.882022,0.719101,0.721786,0.546327,0.971738,0.876748,0.8444,0.894343,0.87117,0.844405,0.057335,0.457105,0.519185,0.541472,0.541472,0.88066,0.998302,0.997452,1.0,0.900538,0.642713,0.534547,0.669762,0.604232,0.599042,0.729198,0.453292,0.466646,0.68147,0.460107,1.0,0.883277,0.670752,0.745115,0.802766,0.748647,0.735183,0.648609,0.556933,0.399248,0.842254,0.707084,0.823905,0.599386,0.705669,0.96015,0.933105,0.97621,0.990176,0.972985,0.97636,0.909353,0.913991,0.946518,0.763174,0.908608,0.723544,0.981409,0.6516,0.604418,0.801526,0.752259,0.632171,0.621218,0.616441,0.604048,0.541278,0.717461,0.695544,0.712042,0.828062,0.6738,0.525542,0.477689,0.510604,0.841551,0.666293,0.612836,0.759975,0.615171,0.918746,0.880302,0.921044,0.818723,0.864373,0.793981,0.889293,0.794537,1.0,0.920052,0.891061,0.659759,0.887399,0.713494,0.924891,0.972758,0.971881,0.670253,0.860519,0.710928,1.0,0.853086,0.911571,0.928488,0.809138,0.740859,0.174456,0.094849,0.072949,0.608881,0.433496,0.620541,0.633911,0.901804,0.95195,0.954784,0.907797,0.914482,0.814697,0.845831,1.0,0.807626,0.957545,0.717799,0.966861,0.841316,0.715943,0.558988,0.610406,0.41793,0.893883,0.879855,0.460218,0.565416,0.429357,0.855064,0.509723,0.526846,0.777982,0.637395,0.648606,0.687042,0.622394,0.780182,0.381432,0.479954,0.725291,0.447986,0.447199,0.300656,0.253685,0.609376,0.383511,0.797457,0.77011,0.802338,0.463079,0.802059,0.963081,0.821598,0.965828,0.800104,0.72791,0.826989,0.590465,0.834031,0.797413,0.826915,0.752049,0.720781,0.506024,0.518615,0.895018,0.796879,0.960217,0.887497,0.911159,0.923088,0.866205,0.547543,0.444619,0.41827,0.795179,0.764961,0.878422,0.991368,0.671462,0.862322,0.721847,0.658652,0.921029,0.666098,0.929733,0.531063,0.908526,0.598997,0.598997,0.862047,0.89169,0.509872,0.57813,0.515809,0.522488,0.437212,0.54053,0.823895,0.609843,0.605777,0.618501,0.549907,0.52501,0.638518,0.755483,0.514283,0.808651,0.71896,0.564861,0.547583,0.607295,0.638775,0.495385,0.67479,0.665014,0.562773,0.748688,0.986704,0.67838,0.650313,0.574703,0.470955,0.5769,0.433436,0.496428,0.403497,0.109643,0.415602,0.384251,0.90207,0.904414,0.965417,0.786541,0.479086,0.472029,0.52716,0.729678,0.464416,0.930063,0.83922,0.638816,0.583177,0.516803,0.597296,0.798813,0.732638,0.856526,0.675778,0.906082,0.488912,0.525908,0.560616,0.711219,0.66607,0.616767,0.560859,0.449747,0.476261,0.47666,0.572556,0.555628,0.614789,0.726994,0.426011,0.435157,0.52557,0.757662,0.458599,0.578364,0.872731,0.811772,0.747264,0.656973,0.889954,1.0,0.588881,0.723205,0.668179,0.512415,0.60707,0.668179,0.515191,0.713486,0.518659,0.636578,0.553986,0.68069,0.696302,0.679303,0.652641,0.528002,0.547686,0.626846,0.700673,0.548716,0.470625,0.433541,0.538112,0.981703,0.643083,0.702481,0.714501,0.482929,0.624793,0.634329,0.469436,0.498605,0.486985,0.547657,0.577405,0.57527,0.720864,0.552006,0.471052,0.594043,0.71042,0.855316,0.477587,0.490729,0.504449
13062422,0.17986,0.15589,0.428167,0.10528,0.066963,0.370238,0.412277,0.295793,0.41715,0.231221,0.367496,0.508792,0.060272,0.495234,0.314436,0.345379,0.277813,0.326515,0.578028,0.689251,0.284681,0.441845,0.278339,0.382397,0.394335,0.689112,0.759617,0.765097,0.917359,0.512534,0.239292,0.323767,0.703967,0.535815,0.54809,0.539317,0.693416,0.537488,0.400548,0.380821,0.690223,0.724926,0.607064,0.730506,0.762646,0.739292,0.717773,0.685958,0.398398,0.725049,0.233088,0.189992,0.073516,0.242322,0.154999,0.225186,0.150018,0.229638,0.58244,0.621915,0.357598,0.102311,0.182724,0.201417,0.336267,0.708411,0.532374,0.768767,0.203845,0.518431,0.405169,0.13926,0.310477,0.204626,0.479822,0.614967,0.650763,0.059806,0.682056,0.321014,0.796627,0.693482,0.232769,0.227916,0.117068,0.689141,0.300212,0.440525,0.383424,0.751035,0.147604,0.362244,0.823658,0.900063,0.21633,0.21633,0.448541,0.325529,0.79423,0.45226,0.880711,0.346089,0.512779,0.171497,0.597159,0.117258,0.48942,0.352864,0.704973,0.65326,0.715933,0.460147,0.084383,0.462914,0.475999,0.138417,0.26314,0.796984,1.0,0.0573,0.401845,0.728477,0.312579,0.669069,0.522675,0.653322,0.813342,0.596634,0.797309,0.721507,0.228569,0.293548,0.40888,0.42644,0.689392,0.17296,0.416306,0.351313,0.712173,0.500863,0.143973,0.536303,0.792607,0.784533,0.823884,0.557322,0.565513,0.82315,0.185121,0.285456,0.238838,0.508367,0.193459,0.249286,0.391484,0.296642,0.477743,0.423373,0.372236,0.584705,0.732527,0.51337,0.790206,0.718285,0.444667,0.636735,0.743762,0.665538,0.606024,0.585449,0.741952,0.696074,0.476456,0.377116,0.38076,0.199797,0.503627,0.686671,0.300834,0.475563,0.806772,0.196086,0.402788,0.595591,0.942272,0.149837,0.385715,0.123302,0.409898,0.348161,0.277636,0.176125,0.108353,0.165677,0.252789,0.730777,0.17343,0.721387,0.329273,0.414782,0.294973,0.140145,0.548942,0.787463,0.359449,0.539963,0.822959,0.613689,0.842132,0.354965,0.278388,0.69864,0.676488,0.358568,0.858685,0.265124,0.320137,0.701385,0.330493,0.242838,0.556673,0.591684,0.392327,0.474307,0.885363,0.885848,0.154567,0.208426,0.302675,0.350019,0.594535,0.347677,0.497071,0.786259,0.697109,0.393754,0.393244,0.779117,0.283647,0.220865,0.224947,0.224383,0.64357,0.637509,0.265933,0.507989,0.093007,0.243209,0.780729,0.760629,0.840873,0.861555,0.860483,0.823215,0.860313,0.827752,0.702958,0.663032,0.22899,0.227742,0.637803,0.842132,0.539564,0.281402,0.431563,0.23447,0.30533,0.594752,0.594752,0.477605,0.563169,0.657379,0.746747,0.714419,0.216922,0.276803,0.357911,0.239374,0.46454,0.311834,0.568769,0.344613,0.236635,0.619194,0.354232,0.472031,0.475486,0.689034,0.074058,0.140513,0.222578,0.170205,0.132695,0.407244,0.166262,0.371831,0.410927,0.247788,0.24643,0.556371,0.554873,0.66336,0.793613,0.474109,0.56644,0.723259,0.653652,0.594707,0.356055,0.356763,0.103518,0.706222,0.426926,0.654365,0.644499,0.528757,0.758905,0.520961,0.108358,0.158148,0.186443,0.186443,0.694537,0.953698,0.949567,1.0,0.838579,0.476072,0.430293,0.729279,0.606363,0.56815,0.332792,0.324588,0.251716,0.580896,0.107371,1.0,0.629361,0.580485,0.537915,0.551332,0.476958,0.468573,0.352506,0.222557,0.382841,0.605389,0.317919,0.623628,0.421782,0.566666,0.796946,0.849225,0.924287,0.934211,0.889668,0.927734,0.757025,0.801785,0.865559,0.526032,0.806895,0.480601,0.925898,0.335475,0.324233,0.541691,0.495709,0.342692,0.369163,0.364262,0.445906,0.169672,0.705394,0.493604,0.520517,0.70865,0.265993,0.244256,0.099201,0.166424,0.624286,0.334699,0.181946,0.480231,0.322516,0.720856,0.679624,0.724097,0.626037,0.65883,0.570258,0.694546,0.577621,0.849145,0.723357,0.732124,0.34283,0.690934,0.392421,0.830873,0.794087,0.791174,0.33775,0.640406,0.329358,0.870231,0.524417,0.683249,0.73486,0.642612,0.596877,0.413459,0.272547,0.47694,0.138739,0.127213,0.353116,0.148331,0.805265,0.803784,0.80812,0.824156,0.754494,0.681073,0.538355,0.8433,0.502846,0.819971,0.423402,0.777528,0.590633,0.282916,0.203736,0.246262,0.072799,0.62082,0.694684,0.150921,0.293629,0.126521,0.66237,0.152941,0.049085,0.37532,0.261969,0.157847,0.356762,0.377295,0.549562,0.227126,0.241262,0.407252,0.480881,0.234533,0.399704,0.25091,0.359366,0.215384,0.597748,0.625642,0.661202,0.100254,0.651927,0.777581,0.535308,0.773807,0.455751,0.261449,0.495058,0.153781,0.709438,0.537208,0.704399,0.471766,0.589751,0.514633,0.110571,0.610126,0.511241,0.768353,0.704849,0.727158,0.692533,0.602166,0.569219,0.598508,0.57044,0.317615,0.425447,0.600921,0.8196,0.27993,0.688387,0.479022,0.314356,0.738782,0.181443,0.792742,0.253559,0.766479,0.179489,0.179489,0.570051,0.618063,0.136968,0.251539,0.139974,0.105109,0.119384,0.208328,0.434661,0.214305,0.173364,0.234485,0.152697,0.133407,0.320426,0.454875,0.135433,0.600792,0.410431,0.340706,0.200396,0.192095,0.278294,0.235826,0.299681,0.34979,0.164447,0.400944,0.819561,0.240861,0.343031,0.189045,0.10172,0.217346,0.17686,0.132062,0.079608,0.511238,0.125492,0.104185,0.740619,0.721695,0.739207,0.708505,0.07068,0.067803,0.144627,0.245531,0.068962,0.847731,0.670289,0.27272,0.23779,0.187107,0.376532,0.548004,0.741511,0.633234,0.31139,0.664029,0.076654,0.107169,0.174059,0.410792,0.303879,0.385004,0.174847,0.097756,0.087464,0.103822,0.165131,0.18947,0.363565,0.684814,0.1435,0.116054,0.395953,0.569422,0.090568,0.17765,0.685223,0.620735,0.485107,0.33246,0.58869,0.931078,0.238907,0.38419,0.276257,0.127107,0.213573,0.276257,0.171393,0.433193,0.138241,0.306016,0.146288,0.302727,0.450491,0.342567,0.353426,0.14138,0.158721,0.28295,0.440965,0.163282,0.110359,0.093759,0.140933,0.792474,0.250203,0.293818,0.433834,0.115356,0.172152,0.324614,0.081422,0.097908,0.119519,0.079165,0.206479,0.229307,0.204019,0.166152,0.05794,0.238416,0.352851,0.685439,0.096627,0.113831,0.121349
13528070,0.33633,0.329994,0.518554,0.256001,0.161441,0.462453,0.384875,0.291489,0.483396,0.342204,0.425785,0.619544,0.196455,0.533621,0.420258,0.456457,0.420334,0.461212,0.680907,0.751767,0.441227,0.600194,0.518212,0.451075,0.537096,0.788235,0.861136,0.8579,0.983049,0.252478,0.375396,0.445774,0.873015,0.719106,0.680104,0.683135,0.838262,0.733043,0.590114,0.534079,0.847589,0.871293,0.777538,0.874853,0.9001,0.863228,0.867156,0.827328,0.573704,0.873712,0.331543,0.306197,0.153243,0.376487,0.270863,0.347,0.217063,0.344705,0.700971,0.545882,0.364311,0.230092,0.234338,0.34607,0.440201,0.772086,0.578527,0.653452,0.359846,0.622776,0.569769,0.264109,0.322893,0.27373,0.481266,0.628964,0.681161,0.209557,0.596247,0.419574,0.671032,0.646225,0.39862,0.278095,0.286414,0.649184,0.355203,0.558658,0.601292,0.857537,0.242724,0.418683,0.906626,0.97434,0.448492,0.448492,0.519937,0.485179,0.82639,0.48888,1.0,0.443535,0.522332,0.384377,0.72221,0.306662,0.585853,0.653588,0.957993,0.904591,0.382218,0.490627,0.293058,0.464168,0.534433,0.311262,0.372596,0.898265,1.0,0.204725,0.477691,0.770096,0.476362,0.767782,0.655261,0.712903,0.856855,0.686913,0.85411,0.772435,0.436835,0.354426,0.40223,0.612401,0.66106,0.197087,0.504999,0.487908,0.736476,0.485432,0.214179,0.620641,0.856201,0.847003,0.87313,0.674549,0.74827,0.913606,0.337358,0.472815,0.414326,0.634667,0.119979,0.339198,0.454145,0.364516,0.252004,0.569801,0.490662,0.565031,0.664573,0.500436,0.690042,0.641968,0.46944,0.575228,0.652643,0.595388,0.553392,0.52707,0.66111,0.63385,0.731624,0.610696,0.551887,0.367433,0.578657,0.814615,0.407026,0.640413,0.711582,0.235956,0.592333,0.770581,0.959066,0.236371,0.457219,0.230484,0.595691,0.461283,0.368599,0.185112,0.304029,0.35643,0.291535,0.712864,0.388541,0.691693,0.461541,0.540048,0.470301,0.245438,0.659774,0.661893,0.380042,0.526099,0.697701,0.749269,0.912155,0.53968,0.35127,0.807632,0.648546,0.511683,0.780687,0.405142,0.365092,0.639162,0.393973,0.307719,0.617733,0.621596,0.453291,0.520309,0.448665,0.447149,0.321155,0.376936,0.522336,0.353755,0.727457,0.524465,0.520597,0.784791,0.743664,0.530631,0.402401,0.726765,0.255903,0.297849,0.295982,0.299055,0.720705,0.715377,0.50399,0.725716,0.301768,0.257766,0.898716,0.889383,0.950658,0.966643,0.970657,0.937224,0.962116,0.94024,0.836316,0.659729,0.326915,0.347567,0.725671,0.912155,0.617197,0.289709,0.497997,0.349546,0.456076,0.630985,0.630985,0.558059,0.609695,0.594031,0.720717,0.709049,0.234497,0.448888,0.551385,0.358425,0.52989,0.448964,0.481029,0.434504,0.348473,0.647737,0.448161,0.490276,0.480868,0.657598,0.181408,0.24774,0.25372,0.353745,0.300065,0.424695,0.36979,0.514411,0.575857,0.367356,0.363704,0.610147,0.608947,0.724198,0.801572,0.561878,0.62803,0.743252,0.689003,0.639174,0.500907,0.494965,0.231644,0.72763,0.484423,0.704253,0.678549,0.611982,0.898735,0.564304,0.190992,0.316462,0.114676,0.114676,0.416458,0.520649,0.509398,1.0,0.442936,0.529264,0.44159,0.749488,0.636445,0.601482,0.518804,0.481671,0.407483,0.650092,0.295034,1.0,0.556835,0.674695,0.638136,0.532839,0.412103,0.411618,0.543377,0.320801,0.490788,0.730677,0.396457,0.732961,0.542097,0.674636,0.877531,0.890664,0.953313,0.948757,0.885096,0.952093,0.795308,0.849975,0.90697,0.290947,0.851698,0.634635,0.95261,0.532981,0.44029,0.583203,0.625315,0.468382,0.504754,0.492951,0.617612,0.403643,0.714738,0.661417,0.691123,0.756469,0.494095,0.344465,0.2536,0.30312,0.710909,0.497728,0.299689,0.625861,0.478255,0.877018,0.825684,0.878269,0.780173,0.809195,0.736483,0.841662,0.732772,1.0,0.878994,0.869531,0.488181,0.841516,0.189848,0.618843,0.494965,0.531857,0.393552,0.529805,0.458652,0.786621,0.543116,0.644439,0.681491,0.733848,0.685301,0.527123,0.369503,0.512321,0.208517,0.297167,0.509276,0.292709,0.749905,0.742355,0.745542,0.763345,0.691718,0.774871,0.657611,0.756008,0.612063,0.765113,0.551319,0.832681,0.274476,0.361008,0.232281,0.426676,0.23845,0.643185,0.653622,0.241824,0.390859,0.23095,0.626414,0.27852,0.183317,0.411719,0.360568,0.320337,0.543352,0.537533,0.699451,0.39312,0.403242,0.53384,0.667296,0.402519,0.500743,0.410793,0.463741,0.417824,0.765552,0.764204,0.828293,0.257013,0.802439,0.745852,0.510802,0.738562,0.341365,0.281049,0.448963,0.334853,0.957283,0.673391,0.956796,0.394046,0.463191,0.584318,0.233608,0.521009,0.41576,0.443072,0.710624,0.498129,0.433491,0.502117,0.534451,0.628605,0.59902,0.346806,0.516851,0.291097,0.898045,0.381957,0.825538,0.628246,0.457441,0.893844,0.224165,0.91131,0.440039,0.762393,0.397856,0.397856,0.623679,0.657165,0.226979,0.298977,0.206417,0.231195,0.175279,0.310185,0.408732,0.347993,0.272477,0.266287,0.28047,0.215773,0.453912,0.52593,0.206511,0.742865,0.42298,0.439448,0.241902,0.233252,0.30364,0.406333,0.312563,0.350297,0.261958,0.372072,0.757781,0.289398,0.377995,0.220568,0.161565,0.245879,0.22251,0.21932,0.239614,0.581949,0.239186,0.220053,0.669232,0.681276,0.671796,0.851665,0.265058,0.188492,0.320428,0.286671,0.206591,0.847691,0.670934,0.398324,0.388518,0.336124,0.548276,0.232561,0.66599,0.58037,0.256979,0.393873,0.213791,0.207559,0.26641,0.456357,0.351965,0.436096,0.22495,0.204967,0.258164,0.235488,0.302552,0.246789,0.306416,0.58103,0.213073,0.190279,0.347355,0.507084,0.199485,0.220307,0.664713,0.586031,0.590131,0.469482,0.752289,1.0,0.28608,0.376636,0.376991,0.223626,0.266654,0.376991,0.060806,0.56173,0.247736,0.508079,0.222005,0.345327,0.511172,0.430269,0.485775,0.205423,0.231506,0.365232,0.44254,0.328909,0.216022,0.202018,0.23707,0.746064,0.24298,0.379896,0.283979,0.156579,0.254414,0.425565,0.223037,0.168063,0.215603,0.219382,0.32049,0.357045,0.258262,0.327178,0.148523,0.31599,0.433444,0.655289,0.205252,0.206107,0.214587
13057717,0.194412,0.342343,0.402997,0.332677,0.189732,0.361011,0.259252,0.312713,0.486043,0.272471,0.460614,0.500093,0.152424,0.592369,0.595591,0.553456,0.411423,0.531393,0.80107,0.932817,0.482322,0.306892,0.505103,0.418255,0.329409,0.762563,0.824084,0.846356,0.961704,0.490967,0.347956,0.487999,0.734539,0.6476,0.605167,0.613991,0.728516,0.516648,0.451725,0.23291,0.703841,0.743375,0.634297,0.7511,0.777298,0.77245,0.728652,0.723401,0.469192,0.738003,0.243378,0.215292,0.245533,0.361891,0.252389,0.403621,0.318932,0.470691,0.61983,0.536584,0.550277,0.131158,0.347716,0.284973,0.393844,0.77401,0.457852,0.605597,0.188391,0.651403,0.419865,0.218287,0.300728,0.146788,0.402909,0.412857,0.515327,0.161006,0.47188,0.348148,0.613206,0.577916,0.42236,0.453812,0.269631,0.547521,0.516441,0.471969,0.280759,0.789682,0.21882,0.464851,0.872985,0.942443,0.224248,0.224248,0.422623,0.3342,0.907994,0.340878,0.560633,0.297204,0.687393,0.296142,0.700549,0.346502,0.579582,0.496365,0.868989,0.821237,0.736456,0.585907,0.207194,0.310247,0.420688,0.191094,0.453839,0.939129,1.0,0.253364,0.454358,0.828737,0.410743,0.800436,0.647657,0.773202,0.906013,0.712152,0.875691,0.830066,0.383241,0.277094,0.385731,0.496453,0.63047,0.295802,0.605714,0.496099,0.643315,0.724755,0.242562,0.636214,0.788562,0.775612,0.831532,0.518628,0.602397,0.649097,0.296379,0.408661,0.325087,0.652721,0.214008,0.349576,0.658069,0.266342,0.524812,0.356493,0.453441,0.696394,0.831484,0.741112,0.92111,0.854717,0.623632,0.797755,0.899247,0.781368,0.759868,0.760973,0.909977,0.774061,0.660097,0.570641,0.299555,0.436986,0.265617,0.418601,0.143612,0.235823,0.559372,0.313635,0.274722,0.358976,0.959577,0.456531,0.575799,0.215015,0.573512,0.545386,0.289043,0.195072,0.221584,0.197821,0.505451,0.439214,0.236429,0.493122,0.497249,0.449561,0.413919,0.198125,0.725144,0.612482,0.368146,0.407657,0.620612,0.540471,0.724055,0.352208,0.286094,0.615089,0.606492,0.26702,0.690979,0.306049,0.2241,0.497777,0.503587,0.292744,0.62549,0.676151,0.489044,0.574238,0.88815,0.894892,0.333477,0.387809,0.200192,0.18851,0.310922,0.280597,0.253477,0.632628,0.897533,0.483771,0.281883,0.678003,0.250282,0.133258,0.125895,0.353422,0.680216,0.675552,0.265104,0.511238,0.209102,0.326526,0.850841,0.869875,0.948836,0.954226,0.955946,0.938379,0.977975,0.923711,0.801389,0.423521,0.228492,0.518055,0.529378,0.724055,0.511273,0.301884,0.395068,0.336682,0.466466,0.736232,0.736232,0.472137,0.418746,0.463536,0.540396,0.511618,0.196509,0.331236,0.320818,0.314254,0.38953,0.335434,0.428926,0.446505,0.509929,0.707515,0.470029,0.33694,0.256419,0.536642,0.186513,0.1839,0.41359,0.273511,0.298886,0.645169,0.27918,0.477051,0.483917,0.390875,0.413842,0.699473,0.698147,0.72282,0.905884,0.574588,0.715587,0.84829,0.76266,0.749878,0.500135,0.504914,0.230378,0.841863,0.518034,0.804703,0.770965,0.664586,0.771171,0.609242,0.316833,0.200366,0.223965,0.223965,0.765851,0.981593,0.975701,1.0,0.859084,0.527955,0.424889,0.727178,0.656343,0.613938,0.423368,0.522046,0.372192,0.590723,0.288632,1.0,0.452927,0.45862,0.449873,0.324216,0.362604,0.362032,0.290533,0.496661,0.527908,0.584479,0.459039,0.675486,0.492472,0.695187,0.811445,0.877427,0.938554,0.948572,0.885693,0.947972,0.770196,0.834217,0.892902,0.537732,0.826035,0.395886,0.938376,0.24636,0.354669,0.69437,0.572079,0.386463,0.461238,0.475898,0.486598,0.224717,0.76685,0.574156,0.518834,0.741792,0.428798,0.455876,0.189138,0.292231,0.790809,0.359835,0.23221,0.257759,0.177957,0.44963,0.414655,0.452122,0.425616,0.40103,0.328717,0.440537,0.392382,0.715007,0.451163,0.437897,0.270043,0.441164,0.372604,0.725565,0.630592,0.653175,0.280314,0.422421,0.242496,0.729828,0.309405,0.594371,0.600638,0.642878,0.631924,0.530111,0.395375,0.571935,0.407745,0.244505,0.399051,0.416357,0.658998,0.673874,0.67742,0.659629,0.611664,0.703796,0.27433,0.633236,0.283168,0.621529,0.476624,0.781687,0.72274,0.541576,0.299582,0.434617,0.223398,0.546441,0.593011,0.372231,0.326102,0.326599,0.569505,0.184519,0.220325,0.536537,0.574838,0.261786,0.55172,0.454124,0.62414,0.37007,0.278023,0.331065,0.586904,0.32986,0.451268,0.326121,0.478868,0.284362,0.601657,0.686866,0.669267,0.357741,0.691935,0.556566,0.270217,0.549333,0.545519,0.359239,0.446358,0.193869,0.874446,0.625638,0.870729,0.392303,0.475566,0.391468,0.246848,0.473075,0.394965,0.675014,0.595324,0.586437,0.534947,0.454697,0.641665,0.658448,0.651186,0.262239,0.715695,0.73636,0.695728,0.574664,0.423945,0.233942,0.145255,0.463977,0.207373,0.494564,0.267513,0.867383,0.262543,0.262543,0.698171,0.741455,0.177643,0.175011,0.194326,0.182893,0.134819,0.202396,0.237191,0.216359,0.297715,0.402528,0.184625,0.129767,0.183001,0.195901,0.106301,0.292459,0.298056,0.182815,0.183909,0.159892,0.293362,0.203262,0.205628,0.280812,0.068292,0.311199,0.635692,0.142027,0.24314,0.147002,0.187033,0.128417,0.233424,0.18239,0.188995,0.614316,0.230522,0.168509,0.581032,0.568733,0.575627,0.723753,0.161483,0.161775,0.222169,0.303727,0.194783,0.843301,0.631996,0.26568,0.309089,0.294056,0.531951,0.491347,0.655169,0.551478,0.278035,0.528622,0.224807,0.153639,0.145651,0.247668,0.296375,0.278783,0.134483,0.17732,0.201857,0.148292,0.169167,0.200579,0.265561,0.718925,0.229035,0.199958,0.336652,0.554888,0.137923,0.168421,0.495446,0.43106,0.538327,0.39881,0.740044,0.967488,0.265549,0.247258,0.292293,0.189789,0.267049,0.292293,0.278899,0.206513,0.119331,0.217304,0.23782,0.264172,0.334438,0.258061,0.201217,0.248594,0.174876,0.213881,0.346315,0.220502,0.131975,0.161471,0.169875,0.531796,0.209702,0.188459,0.291559,0.129257,0.281719,0.355092,0.215854,0.206173,0.128895,0.162093,0.161496,0.274672,0.301561,0.242427,0.191221,0.288023,0.491037,0.846974,0.126821,0.155465,0.150269
13308163,0.261085,0.327806,0.677393,0.345676,0.242145,0.387128,0.526297,0.158824,0.224268,0.423237,0.251969,0.742773,0.25418,0.249977,0.510761,0.538365,0.466208,0.523676,0.737826,0.807011,0.536328,0.744862,0.456671,0.708898,0.558435,0.776687,0.823807,0.832157,0.950499,0.389291,0.500493,0.523247,0.849876,0.656951,0.751924,0.788177,0.834169,0.755683,0.597764,0.514123,0.843626,0.874775,0.790477,0.865772,0.891917,0.884783,0.85414,0.829387,0.598884,0.867631,0.445072,0.384249,0.256799,0.297413,0.353198,0.424295,0.298739,0.403999,0.639448,0.459362,0.375561,0.251505,0.362075,0.511206,0.31136,0.505422,0.403627,0.602791,0.369837,0.656525,0.646836,0.325732,0.221034,0.41387,0.670572,0.808633,0.818372,0.314024,0.700605,0.556838,0.62109,0.595839,0.554041,0.477643,0.357303,0.810466,0.364769,0.673938,0.651464,0.826219,0.199325,0.384493,0.899112,0.935314,0.470045,0.470045,0.620707,0.548031,0.865914,0.420491,0.923209,0.476768,0.640615,0.452955,0.880838,0.298754,0.633605,0.66331,0.965162,0.895859,0.578631,0.286647,0.300278,0.418838,0.523876,0.424327,0.413944,0.913286,1.0,0.243247,0.39115,0.766692,0.521335,0.759462,0.663614,0.72336,0.856215,0.717902,0.844601,0.802636,0.318766,0.320504,0.496842,0.565362,0.5237,0.065047,0.273334,0.528954,0.636105,0.574214,0.352298,0.456134,0.824294,0.815903,0.85714,0.767606,0.747714,0.956248,0.244635,0.453046,0.502498,0.663267,0.262877,0.374831,0.551174,0.37737,0.454273,0.697893,0.667938,0.690758,0.830797,0.615434,0.832775,0.838022,0.577414,0.729153,0.814423,0.77944,0.692043,0.696694,0.836045,0.78209,0.743351,0.614401,0.535545,0.252796,0.41004,0.722283,0.377268,0.718884,0.647036,0.190579,0.586641,0.747176,0.786464,0.268342,0.647556,0.290163,0.538963,0.598727,0.437801,0.204359,0.387135,0.376084,0.298828,0.698737,0.28311,0.871635,0.627054,0.706041,0.6084,0.418774,0.788773,0.619936,0.345814,0.348199,0.676044,0.75975,0.969644,0.478027,0.464548,0.816015,0.701318,0.566372,0.964684,0.216913,0.564041,0.848256,0.537385,0.188591,0.30135,0.299347,0.220763,0.223262,0.689993,0.686506,0.325326,0.427772,0.559919,0.549434,0.67557,0.61673,0.649178,0.911299,0.885044,0.581932,0.573302,0.849015,0.381982,0.424434,0.454886,0.328603,0.710232,0.705619,0.458015,0.67151,0.245504,0.375017,0.893964,0.909293,0.951824,0.976596,0.980428,0.948928,0.964692,0.952537,0.86522,0.818042,0.540105,0.439955,0.797941,0.969644,0.69645,0.379269,0.583789,0.38385,0.573052,0.697666,0.697666,0.454208,0.695845,0.748453,0.861036,0.817905,0.266919,0.579658,0.673297,0.374035,0.456353,0.58327,0.496572,0.580374,0.385223,0.319688,0.481807,0.566963,0.628054,0.825152,0.145074,0.126212,0.216254,0.361014,0.271281,0.506537,0.370128,0.623604,0.63442,0.433048,0.330985,0.736421,0.735119,0.851471,0.93781,0.705439,0.76754,0.869832,0.807826,0.795334,0.669967,0.6701,0.322072,0.885774,0.664401,0.809294,0.790515,0.724198,0.891383,0.28118,0.245192,0.358862,0.273541,0.273541,0.621276,0.732269,0.741951,1.0,0.645348,0.362266,0.271898,0.491301,0.423833,0.404274,0.476912,0.399565,0.336626,0.652169,0.332791,1.0,0.548592,0.464042,0.536338,0.503172,0.408899,0.400867,0.580901,0.316544,0.399855,0.861835,0.507971,0.835797,0.515437,0.647045,0.767503,0.71868,0.790992,0.775545,0.717559,0.770834,0.635579,0.681471,0.742389,0.393169,0.674189,0.556524,0.778219,0.479703,0.558419,0.732541,0.797152,0.599608,0.638741,0.669932,0.56507,0.456093,0.548225,0.6445,0.669841,0.814952,0.426596,0.291383,0.218444,0.261723,0.634189,0.37924,0.340189,0.610997,0.45776,0.852586,0.79185,0.854022,0.740231,0.777174,0.691916,0.7944,0.707712,0.95019,0.853678,0.818569,0.500553,0.789963,0.295033,0.514155,0.587844,0.588218,0.333004,0.508099,0.654128,0.939359,0.703891,0.824506,0.865435,0.884856,0.850334,0.291227,0.126134,0.232002,0.37185,0.331855,0.601385,0.365955,0.897357,0.907924,0.911508,0.90016,0.844699,0.918665,0.650737,0.935672,0.60808,0.92994,0.50346,0.806039,0.458866,0.444098,0.280435,0.331861,0.223036,0.55878,0.701353,0.276005,0.282507,0.268789,0.655425,0.233101,0.268116,0.46446,0.401107,0.395212,0.487868,0.416516,0.502413,0.239193,0.339101,0.631819,0.397858,0.270729,0.195959,0.18306,0.490868,0.382236,0.785728,0.781202,0.81141,0.279464,0.806484,0.910742,0.655285,0.900418,0.401467,0.46929,0.476838,0.412406,0.958178,0.518345,0.95337,0.32448,0.338943,0.498246,0.283488,0.496845,0.423755,0.628146,0.632331,0.517912,0.532748,0.518976,0.341073,0.356451,0.327055,0.431246,0.565543,0.507631,0.956606,0.433034,0.744497,0.636515,0.493054,0.818381,0.41087,0.844311,0.412979,0.884507,0.454469,0.454469,0.745834,0.784903,0.213974,0.340282,0.239803,0.318835,0.153993,0.243401,0.436936,0.343712,0.440638,0.392717,0.388941,0.251631,0.360155,0.536766,0.31727,0.713396,0.578022,0.416978,0.333365,0.365121,0.452251,0.434015,0.408913,0.474965,0.346643,0.542945,0.926552,0.356044,0.354022,0.320039,0.179103,0.256129,0.20259,0.253206,0.198766,0.275122,0.189602,0.183499,0.830306,0.839693,0.846233,0.83318,0.283385,0.235117,0.258802,0.498546,0.157798,0.658329,0.516384,0.508814,0.43957,0.432696,0.650917,0.361164,0.518921,0.491345,0.262138,0.441997,0.287473,0.261035,0.285666,0.478653,0.411134,0.409901,0.323293,0.229767,0.296782,0.216285,0.262947,0.239883,0.302182,0.485485,0.1374,0.147427,0.238907,0.375207,0.228677,0.337848,0.787717,0.699611,0.556669,0.507566,0.686896,0.963334,0.249452,0.347205,0.313515,0.200636,0.251999,0.313515,0.179178,0.49313,0.275222,0.495254,0.326707,0.353805,0.358918,0.358001,0.389846,0.287734,0.245212,0.306245,0.326342,0.424519,0.255972,0.207562,0.223504,0.906752,0.259654,0.417306,0.391767,0.180284,0.323243,0.342334,0.270999,0.249231,0.233112,0.282734,0.310479,0.333441,0.371975,0.395267,0.182137,0.430047,0.611919,0.810174,0.254213,0.236,0.248133


In [13]:
data_matrix = np.array(data_matrix)

gb_raw_shape = data_matrix.shape
print(gb_raw_shape)

gb_data = []
for i in range(gb_raw_shape[1]):
    gb_data.extend(data_matrix[:, i, :])
gb_data = np.array(gb_data)
print(gb_data.shape)

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

project_numbers = np.array(list(range(1, gb_raw_shape[0] + 1)) * gb_raw_shape[1])

# get the projects for lowest predictions for each publication with distance matrix
for num_top in range(10, 0, -1):
    project_numbers_pred = []
    for i in range(len(train_pub_data), distance_matrix.shape[1]):
        project_numbers_pred.append(list(np.argsort(distance_matrix[:, i] + 1))[:num_top])

    project_lists = []
    for i in range(0, gb_data.shape[0], gb_raw_shape[0]):
        pub_belongs = gb_data[i:i + gb_raw_shape[0], 0] * project_numbers[i:i + gb_raw_shape[0]]
        project = sorted(list(pub_belongs[pub_belongs != 0].astype(int)), reverse=True)
        project_lists.append(project)

    project_lists_test = project_lists[len(train_pub_data):]

    # calculate accuracy
    # use y_test as mask for project_numbers_test
    accuracy_list = []
    for i, project_list in enumerate(list(project_lists_test)):
        ratio = len(set(project_numbers_pred[i]) & set(project_list)) / len(set(project_list))
        accuracy_list.append(ratio)

    accuracy = sum(accuracy_list) / len(accuracy_list)
    print(accuracy)

(225, 635, 2)
(142875, 2)
0.08527131782945736
0.06976744186046512
0.046511627906976744
0.03875968992248062
0.015503875968992248
0.015503875968992248
0.015503875968992248
0.015503875968992248
0.007751937984496124
0.0
