In [1]:
import os
import time
import json
import requests

from tqdm import tqdm
from ast import literal_eval
import numpy as np
import pandas as pd

In [2]:
def merge_annotations(x, y):
    if type(y) == str:
        return y.strip().lower()
    return x.strip().lower()

def load_kim_dataset(data_filename = '/export/scratch/zeren/KimNLP/RawData/dec_12_annotations.tsv'):
    data = pd.read_csv(data_filename, sep='\t')

    data['annotation'] = data.apply(lambda x: merge_annotations(x['previous annotation'], x['new annotation']), axis=1)
    # columns = ['cited title', 'cited abstract', 'citing title', 'citing abstract', 'citation context', 'annotation']
    # data = data[columns]
    data = data.rename(columns={
        'cited title': 'cited_title', 
        'cited abstract': 'cited_abstract', 
        'citing title': 'citing_title', 
        'citing abstract': 'citing_abstract', 
        'citation context': 'citation_context', 
        'annotation': 'label'
    }).reset_index().drop(columns='index')
    data = data.fillna('')
    data.head()
    return data

In [5]:
data = load_kim_dataset()
# data.head()
dois = list(set(data['cited doi'].tolist() + data['citing doi'].tolist()))
# data[data['citing doi'] == 'https://doi.org/none_22851346']['citing_title'].tolist()

In [7]:
len(dois)

716

In [10]:
for d in dois:
    if 'none' in d:
        print(d)

https://doi.org/none_28230327
https://doi.org/none_13455990
https://doi.org/none_8217700
https://doi.org/none_26526364
https://doi.org/none_21640901
https://doi.org/none_1153070
https://doi.org/none_15244259
https://doi.org/none_20146078
https://doi.org/none_1789293
https://doi.org/none_5285167
https://doi.org/none_22851346
https://doi.org/none_21795708
https://doi.org/none_13945976
https://doi.org/none_25411478
https://doi.org/none_15360911
https://doi.org/none_1920016
https://doi.org/none_28303267
https://doi.org/none_18529447
https://doi.org/none_23942303
https://doi.org/none_28657560
https://doi.org/none_9096290
https://doi.org/none_17436963
https://doi.org/none_28160190
https://doi.org/none_8051345
https://doi.org/none_24264187
https://doi.org/none_632799
https://doi.org/none_17936269
https://doi.org/none_21013761
https://doi.org/none_8465186
https://doi.org/none_3335766
https://doi.org/none_20756763
https://doi.org/none_27723720
https://doi.org/none_28182591
https://doi.org/none_

In [19]:
dois[0][16:]

'10.1021/acs.jpclett.5b02080'

In [20]:
graphs = []

for doi in tqdm(dois):
    url = 'https://api.semanticscholar.org/graph/v1/paper/DOI:{}?fields=citations,references'.format(doi[16:])
    res = requests.get(url)

    
    if res.status_code == 200:
        res_json = res.json()

        graphs.append(res_json)
    else:
        print(doi)

  1%|▏         | 10/716 [00:03<03:34,  3.29it/s]

https://doi.org/none_8051345


  5%|▍         | 33/716 [00:10<03:23,  3.36it/s]

https://doi.org/none_22304794


  6%|▌         | 41/716 [00:13<03:07,  3.60it/s]

https://doi.org/none_22851346


  8%|▊         | 58/716 [00:18<02:50,  3.85it/s]

https://doi.org/none_28303267


  9%|▉         | 67/716 [00:20<03:00,  3.60it/s]

https://doi.org/none_17436963


 10%|▉         | 71/716 [00:22<03:01,  3.56it/s]

https://doi.org/none_3335766


 12%|█▏        | 88/716 [00:27<02:59,  3.50it/s]

https://doi.org/none_28230327


 15%|█▍        | 106/716 [00:32<02:48,  3.63it/s]

https://doi.org/none_13455990


 18%|█▊        | 126/716 [00:39<02:39,  3.70it/s]

https://doi.org/none_8217700


 19%|█▉        | 135/716 [00:42<03:02,  3.19it/s]

https://doi.org/none_26526364


 28%|██▊       | 203/716 [01:04<02:36,  3.27it/s]

https://doi.org/none_27723720


 29%|██▊       | 205/716 [01:05<02:21,  3.61it/s]

https://doi.org/10.1080/14786435.2018.1480838


 29%|██▉       | 207/716 [01:05<02:32,  3.34it/s]

https://doi.org/none_28160190


 29%|██▉       | 209/716 [01:06<02:11,  3.86it/s]

https://doi.org/10.1107/s0108767318095934


 29%|██▉       | 210/716 [01:06<02:21,  3.56it/s]

https://doi.org/10.1186/1556-276x-6-291


 30%|███       | 215/716 [01:07<01:34,  5.28it/s]

https://doi.org/10.1016/j.commatsci.2017.03.028
https://doi.org/10.3390/ma12050750


 30%|███       | 217/716 [01:07<01:34,  5.30it/s]

https://doi.org/10.1021/jp5030558


 31%|███       | 220/716 [01:08<01:36,  5.15it/s]

https://doi.org/10.1155/2013/965282
https://doi.org/10.1186/s11671-017-2412-2


 31%|███       | 221/716 [01:08<01:23,  5.93it/s]

https://doi.org/10.1007/s13632-012-0008-x


 31%|███▏      | 225/716 [01:09<01:55,  4.24it/s]

https://doi.org/10.1016/j.carbon.2016.03.007
https://doi.org/none_15244259


 32%|███▏      | 226/716 [01:09<01:48,  4.52it/s]

https://doi.org/10.1186/1556-276x-7-148


 32%|███▏      | 228/716 [01:10<02:03,  3.96it/s]

https://doi.org/none_21640901


 32%|███▏      | 231/716 [01:11<01:49,  4.42it/s]

https://doi.org/10.1016/j.jnucmat.2014.12.111
https://doi.org/10.1103/physrevb.54.8398


 33%|███▎      | 233/716 [01:11<01:26,  5.57it/s]

https://doi.org/10.1021/acsomega.7b00732
https://doi.org/10.1007/s12274-009-9078-8
https://doi.org/10.1021/acs.jpcc.6b10908


 33%|███▎      | 236/716 [01:11<01:20,  5.95it/s]

https://doi.org/10.1016/j.actamat.2015.07.055
https://doi.org/10.1103/physrevb.95.045418


 33%|███▎      | 238/716 [01:12<01:14,  6.43it/s]

https://doi.org/10.1016/j.jallcom.2015.09.149
https://doi.org/10.1016/j.commatsci.2018.02.020


 34%|███▎      | 241/716 [01:12<01:04,  7.31it/s]

https://doi.org/none_20376022
https://doi.org/10.1016/j.physe.2017.06.012
https://doi.org/10.1007/s00214-015-1681-z


 34%|███▍      | 243/716 [01:12<01:09,  6.84it/s]

https://doi.org/none_632799
https://doi.org/10.1088/0965-0393/19/8/083001


 34%|███▍      | 245/716 [01:13<01:06,  7.08it/s]

https://doi.org/10.1021/acsomega.9b00589
https://doi.org/10.1051/m2an:2007024


 34%|███▍      | 247/716 [01:13<00:57,  8.19it/s]

https://doi.org/10.1186/s40199-014-0085-2
https://doi.org/10.1016/j.physrep.2014.03.003


 35%|███▍      | 249/716 [01:13<01:11,  6.50it/s]

https://doi.org/10.1038/srep43785
https://doi.org/10.1073/pnas.1510342112


 35%|███▌      | 251/716 [01:14<01:07,  6.85it/s]

https://doi.org/10.1103/physreve.84.061122
https://doi.org/10.1016/j.physe.2017.03.005


 35%|███▌      | 253/716 [01:14<00:57,  8.10it/s]

https://doi.org/10.1038/s41524-018-0098-3
https://doi.org/10.1103/physrevb.41.12197


 36%|███▌      | 255/716 [01:14<01:11,  6.43it/s]

https://doi.org/10.1063/1.3460127
https://doi.org/10.1016/j.carbon.2015.02.075


 36%|███▌      | 257/716 [01:14<01:08,  6.70it/s]

https://doi.org/10.1109/tnano.2019.2935876
https://doi.org/10.1016/j.physrep.2018.03.001


 36%|███▌      | 258/716 [01:15<01:13,  6.22it/s]

https://doi.org/10.16984/saufenbilder.489467
https://doi.org/10.1016/j.actamat.2018.09.052


 36%|███▋      | 261/716 [01:15<01:12,  6.31it/s]

https://doi.org/10.7454/mss.v22i3.8512
https://doi.org/10.1260/1750-9548.7.2.95


 37%|███▋      | 262/716 [01:15<01:06,  6.85it/s]

https://doi.org/10.3390/met8060430
https://doi.org/10.3390/ma12020217


 37%|███▋      | 265/716 [01:16<00:59,  7.53it/s]

https://doi.org/10.1016/j.jmps.2007.09.005
https://doi.org/10.1021/jp101332k


 37%|███▋      | 268/716 [01:16<00:56,  7.96it/s]

https://doi.org/10.1038/srep34074
https://doi.org/10.1103/physrevb.43.12571
https://doi.org/10.1186/s40759-019-0042-3


 38%|███▊      | 270/716 [01:16<00:51,  8.66it/s]

https://doi.org/10.1073/pnas.1505788112
https://doi.org/10.3390/polym10111289


 38%|███▊      | 272/716 [01:16<00:57,  7.67it/s]

https://doi.org/10.1080/01418619508244468
https://doi.org/10.3390/ma12152354


 38%|███▊      | 273/716 [01:17<00:54,  8.10it/s]

https://doi.org/10.1016/j.actamat.2015.08.052
https://doi.org/10.3390/nano8100848


 39%|███▊      | 276/716 [01:17<01:02,  7.00it/s]

https://doi.org/10.2207/qjjws.23.509
https://doi.org/10.1088/0965-0393/21/8/085004


 39%|███▉      | 278/716 [01:17<01:02,  7.02it/s]

https://doi.org/none_25411478
https://doi.org/10.2991/icamcs-16.2016.64


 39%|███▉      | 280/716 [01:18<01:00,  7.16it/s]

https://doi.org/10.1016/j.carbon.2016.05.009
https://doi.org/none_3387763


 39%|███▉      | 282/716 [01:18<01:02,  6.96it/s]

https://doi.org/10.3390/en10122010
https://doi.org/10.1115/1.4006750


 40%|███▉      | 284/716 [01:18<01:00,  7.11it/s]

https://doi.org/10.1103/physrevb.58.2539
https://doi.org/10.1088/1367-2630/11/12/123017


 40%|███▉      | 286/716 [01:18<00:52,  8.22it/s]

https://doi.org/10.20944/preprints201906.0279.v1
https://doi.org/10.1615/intjmultcompeng.2011002514


 40%|████      | 288/716 [01:19<01:04,  6.63it/s]

https://doi.org/10.1038/srep06399
https://doi.org/10.1073/pnas.0806174105


 40%|████      | 289/716 [01:19<01:08,  6.23it/s]

https://doi.org/10.1016/j.cpc.2016.04.001
https://doi.org/10.1016/j.mprp.2018.01.003


 41%|████      | 292/716 [01:19<00:59,  7.14it/s]

https://doi.org/10.1016/j.actamat.2017.08.058
https://doi.org/10.1186/1556-276x-8-490


 41%|████      | 294/716 [01:20<01:09,  6.11it/s]

https://doi.org/10.1007/s00161-009-0109-1
https://doi.org/10.3390/met7100438


 41%|████▏     | 296/716 [01:20<00:56,  7.46it/s]

https://doi.org/none_15360911
https://doi.org/10.1088/0022-3727/47/22/224007


 42%|████▏     | 298/716 [01:20<00:57,  7.32it/s]

https://doi.org/10.1088/0965-0393/21/3/035011
https://doi.org/10.1016/j.msea.2014.12.075


 42%|████▏     | 299/716 [01:20<00:52,  7.92it/s]

https://doi.org/10.1007/s10853-015-8961-9
https://doi.org/10.3390/ma12132076


 42%|████▏     | 302/716 [01:21<00:54,  7.53it/s]

https://doi.org/10.3390/nano9081107
https://doi.org/10.1103/physrevb.95.214302


 42%|████▏     | 304/716 [01:21<00:48,  8.52it/s]

https://doi.org/none_1153070
https://doi.org/10.1038/npjcompumats.2015.11
https://doi.org/10.1186/1556-276x-6-481


 43%|████▎     | 307/716 [01:21<00:56,  7.27it/s]

https://doi.org/10.1073/pnas.1310036110
https://doi.org/10.1016/j.commatsci.2016.12.016


 43%|████▎     | 309/716 [01:22<01:03,  6.44it/s]

https://doi.org/10.3390/cryst7020046
https://doi.org/10.1080/14686996.2017.1422224


 43%|████▎     | 311/716 [01:22<00:52,  7.70it/s]

https://doi.org/10.1103/physrevb.89.054310
https://doi.org/10.1016/j.jallcom.2015.03.173
https://doi.org/10.1080/01418619208247999


 44%|████▍     | 314/716 [01:22<00:46,  8.70it/s]

https://doi.org/10.3390/ma12091477
https://doi.org/10.1177/2516598418765359


 44%|████▍     | 317/716 [01:23<00:47,  8.45it/s]

https://doi.org/10.5539/jmsr.v4n3p15
https://doi.org/10.5772/intechopen.68507
https://doi.org/10.1007/s10853-017-1706-1


 45%|████▍     | 319/716 [01:23<00:52,  7.54it/s]

https://doi.org/10.3390/cryst6070077
https://doi.org/10.1088/0965-0393/23/7/074002


 45%|████▍     | 321/716 [01:23<00:47,  8.39it/s]

https://doi.org/10.1016/j.actamat.2016.07.053
https://doi.org/10.1088/0957-4484/23/2/025703


 45%|████▌     | 323/716 [01:23<00:50,  7.81it/s]

https://doi.org/10.1088/0034-4885/77/4/046501
https://doi.org/10.1039/c7cp01268c


 46%|████▌     | 326/716 [01:24<00:54,  7.18it/s]

https://doi.org/10.1186/s40192-015-0040-1
https://doi.org/10.1038/srep03157
https://doi.org/none_1789293


 46%|████▌     | 328/716 [01:24<00:53,  7.23it/s]

https://doi.org/10.1016/j.commatsci.2009.09.026
https://doi.org/10.2478/s13531-013-0116-7


 46%|████▌     | 329/716 [01:24<01:00,  6.42it/s]

https://doi.org/10.1021/la047545h
https://doi.org/none_10112067


 46%|████▋     | 332/716 [01:25<00:53,  7.22it/s]

https://doi.org/10.1016/j.actamat.2015.11.046
https://doi.org/10.1038/s41598-019-38941-9


 47%|████▋     | 334/716 [01:25<00:52,  7.31it/s]

https://doi.org/10.1021/acsnano.8b04050
https://doi.org/none_12042695


 47%|████▋     | 338/716 [01:25<00:41,  9.07it/s]

https://doi.org/none_18529447
https://doi.org/10.1016/j.jmps.2015.07.001
https://doi.org/10.1103/physrevb.36.6434
https://doi.org/10.1103/physrevb.99.205134


 47%|████▋     | 340/716 [01:26<00:39,  9.44it/s]

https://doi.org/none_25695403
https://doi.org/10.1016/j.carbon.2015.11.012


 48%|████▊     | 342/716 [01:26<00:40,  9.33it/s]

https://doi.org/none_8465186
https://doi.org/10.1038/ncomms7035
https://doi.org/10.1016/j.fluid.2019.05.008


 48%|████▊     | 345/716 [01:26<00:50,  7.28it/s]

https://doi.org/10.1088/0953-8984/19/32/326220
https://doi.org/10.1038/srep12923


 48%|████▊     | 347/716 [01:27<00:52,  7.03it/s]

https://doi.org/10.1088/1361-648x/aae09f
https://doi.org/10.1016/j.commatsci.2014.12.036


 49%|████▊     | 349/716 [01:27<00:45,  8.01it/s]

https://doi.org/10.1073/pnas.1802300115
https://doi.org/10.1021/jp709896w


 49%|████▉     | 350/716 [01:27<00:52,  6.99it/s]

https://doi.org/10.3390/molecules24091693
https://doi.org/10.1098/rspa.2016.0093


 49%|████▉     | 353/716 [01:27<00:48,  7.48it/s]

https://doi.org/10.1515/phys-2016-0040
https://doi.org/10.1002/wcms.1363


 50%|████▉     | 355/716 [01:28<00:56,  6.43it/s]

https://doi.org/10.1109/tdmr.2018.2842253
https://doi.org/10.17586/2220-8054-2015-6-5-650-660


 50%|████▉     | 357/716 [01:28<00:59,  6.06it/s]

https://doi.org/10.1155/2013/434636
https://doi.org/10.1016/j.actamat.2005.05.001


 50%|█████     | 359/716 [01:28<01:01,  5.82it/s]

https://doi.org/10.3390/electronics4041109
https://doi.org/10.1088/0957-4484/27/5/055701


 51%|█████     | 362/716 [01:29<00:45,  7.73it/s]

https://doi.org/10.1016/j.carbon.2018.07.073
https://doi.org/10.1061/9780784413111.008
https://doi.org/10.1038/s41524-017-0042-y


 51%|█████     | 364/716 [01:29<00:54,  6.49it/s]

https://doi.org/10.1016/j.jcp.2014.12.018
https://doi.org/10.1063/1.4905942


 51%|█████     | 366/716 [01:29<00:45,  7.66it/s]

https://doi.org/10.1126/sciadv.1602916
https://doi.org/10.1016/j.commatsci.2018.08.011


 51%|█████▏    | 368/716 [01:30<00:48,  7.10it/s]

https://doi.org/10.1080/08927022.2018.1447107
https://doi.org/10.3390/ma9050355


 52%|█████▏    | 371/716 [01:30<00:40,  8.57it/s]

https://doi.org/10.3390/lubricants6020043
https://doi.org/10.1557/jmr.2008.0090
https://doi.org/10.1103/physrevb.67.125101


 52%|█████▏    | 373/716 [01:30<00:45,  7.52it/s]

https://doi.org/10.1186/s40192-016-0051-6
https://doi.org/10.1016/j.carbon.2017.06.009


 52%|█████▏    | 375/716 [01:30<00:40,  8.47it/s]

https://doi.org/10.1016/j.actamat.2012.08.018
https://doi.org/10.5539/jmsr.v5n3p1


 53%|█████▎    | 378/716 [01:31<00:49,  6.79it/s]

https://doi.org/10.3390/ma11020317
https://doi.org/10.1063/1.5064531
https://doi.org/10.1016/j.jmps.2016.08.002


 53%|█████▎    | 380/716 [01:31<00:42,  7.99it/s]

https://doi.org/10.5539/apr.v7n6p1
https://doi.org/none_20756763


 53%|█████▎    | 381/716 [01:31<00:46,  7.15it/s]

https://doi.org/10.1016/j.tsf.2014.12.019
https://doi.org/10.3390/ma10070813


 54%|█████▎    | 384/716 [01:32<00:43,  7.66it/s]

https://doi.org/10.5772/15988
https://doi.org/10.1016/j.ijsolstr.2016.03.030


 54%|█████▍    | 386/716 [01:32<00:50,  6.51it/s]

https://doi.org/10.1088/2053-1583/aaded7
https://doi.org/10.1016/j.cma.2016.03.011


 54%|█████▍    | 388/716 [01:32<00:42,  7.65it/s]

https://doi.org/10.1186/1556-276x-6-502
https://doi.org/10.1051/snamc/201401302


 54%|█████▍    | 390/716 [01:33<00:49,  6.57it/s]

https://doi.org/10.1038/srep31047
https://doi.org/10.1021/acsomega.9b00174


 55%|█████▍    | 392/716 [01:33<00:48,  6.65it/s]

https://doi.org/10.1038/s41524-017-0056-5
https://doi.org/10.1039/c4cp03398a


 55%|█████▌    | 394/716 [01:33<00:45,  7.01it/s]

https://doi.org/10.2478/s11534-006-0028-8
https://doi.org/10.1126/sciadv.aau8044


 55%|█████▌    | 396/716 [01:33<00:44,  7.15it/s]

https://doi.org/10.1016/j.mechmat.2015.02.007
https://doi.org/10.1007/s00466-018-1632-3


 56%|█████▌    | 398/716 [01:34<00:51,  6.23it/s]

https://doi.org/10.1038/srep12177
https://doi.org/none_17936269


 56%|█████▌    | 400/716 [01:34<00:40,  7.71it/s]

https://doi.org/10.1016/j.ssc.2017.11.003
https://doi.org/10.1088/0953-8984/25/13/135002
https://doi.org/none_18350768


 56%|█████▋    | 403/716 [01:34<00:47,  6.54it/s]

https://doi.org/10.1021/acs.jpcc.5b08350
https://doi.org/none_13945976


 57%|█████▋    | 405/716 [01:35<00:46,  6.76it/s]

https://doi.org/10.1016/j.jmps.2014.06.007
https://doi.org/10.1038/srep00194


 57%|█████▋    | 407/716 [01:35<00:48,  6.34it/s]

https://doi.org/10.5772/17946
https://doi.org/10.1021/acs.jpcc.9b02716


 57%|█████▋    | 409/716 [01:35<00:39,  7.70it/s]

https://doi.org/10.1038/s41598-018-20997-8
https://doi.org/10.1088/0965-0393/4/1/004


 57%|█████▋    | 411/716 [01:36<00:46,  6.54it/s]

https://doi.org/10.1007/s10853-016-0351-4
https://doi.org/10.2138/am-2015-4862


 58%|█████▊    | 413/716 [01:36<00:39,  7.74it/s]

https://doi.org/10.4236/njgc.2016.63005
https://doi.org/10.1080/14786435.2012.747012
https://doi.org/10.24297/jap.v14i3.7601


 58%|█████▊    | 416/716 [01:36<00:37,  7.91it/s]

https://doi.org/none_28182591
https://doi.org/10.1016/j.jallcom.2016.04.055


 58%|█████▊    | 417/716 [01:36<00:41,  7.14it/s]

https://doi.org/10.1073/pnas.1306371110
https://doi.org/none_4818846


 59%|█████▊    | 420/716 [01:37<00:38,  7.64it/s]

https://doi.org/10.1103/physrevb.63.224106
https://doi.org/10.1038/srep01039
https://doi.org/10.1103/physrevb.76.214105


 59%|█████▉    | 423/716 [01:37<00:38,  7.56it/s]

https://doi.org/10.2174/1573413712666160530105707
https://doi.org/10.1103/physrevb.73.045206


 59%|█████▉    | 425/716 [01:37<00:39,  7.42it/s]

https://doi.org/10.1007/s40870-016-0080-4
https://doi.org/10.1007/s00161-010-0169-2


 60%|█████▉    | 427/716 [01:38<00:40,  7.06it/s]

https://doi.org/10.1038/srep39042
https://doi.org/10.1038/s41524-018-0062-2


 60%|█████▉    | 429/716 [01:38<00:42,  6.78it/s]

https://doi.org/10.1021/es5043782
https://doi.org/10.1038/srep05167


 60%|██████    | 432/716 [01:38<00:33,  8.42it/s]

https://doi.org/10.1016/j.actamat.2015.11.037
https://doi.org/10.1038/s41467-017-01305-w
https://doi.org/10.1088/2053-1583/3/2/025033


 61%|██████    | 435/716 [01:39<00:33,  8.41it/s]

https://doi.org/10.1038/s41524-018-0112-9
https://doi.org/none_1920016
https://doi.org/10.1063/1.2724570


 61%|██████    | 438/716 [01:39<00:31,  8.69it/s]

https://doi.org/10.1016/j.ijengsci.2014.02.018
https://doi.org/10.1038/s41598-019-46672-0
https://doi.org/10.1126/sciadv.1700176


 62%|██████▏   | 441/716 [01:39<00:29,  9.48it/s]

https://doi.org/10.1016/j.carbon.2015.04.044
https://doi.org/10.1557/jmr.2019.19
https://doi.org/10.1088/0965-0393/17/5/055004


 62%|██████▏   | 443/716 [01:40<00:32,  8.48it/s]

https://doi.org/10.3390/nano9040552
https://doi.org/10.1021/acsnano.6b03963


 62%|██████▏   | 445/716 [01:40<00:39,  6.86it/s]

https://doi.org/10.1186/s13321-019-0369-0
https://doi.org/10.1016/j.physa.2017.02.077


 62%|██████▏   | 447/716 [01:40<00:40,  6.70it/s]

https://doi.org/10.1063/1.4905549
https://doi.org/10.1155/2014/365642


 63%|██████▎   | 449/716 [01:40<00:33,  7.96it/s]

https://doi.org/10.1016/j.jmps.2012.09.008
https://doi.org/10.1016/j.cirp.2017.05.004
https://doi.org/none_20146078


 63%|██████▎   | 452/716 [01:41<00:33,  7.82it/s]

https://doi.org/10.1021/acs.jpcb.9b04298
https://doi.org/10.1007/s11051-017-4105-2


 63%|██████▎   | 454/716 [01:41<00:39,  6.61it/s]

https://doi.org/10.19113/sdufbed.37948
https://doi.org/10.1103/physrevb.89.094102


 64%|██████▎   | 456/716 [01:41<00:33,  7.66it/s]

https://doi.org/none_28657560
https://doi.org/10.1103/physrevb.83.054116


 64%|██████▍   | 458/716 [01:42<00:34,  7.47it/s]

https://doi.org/10.1007/s10853-016-9834-6
https://doi.org/10.1016/j.physe.2018.11.025
https://doi.org/10.1103/revmodphys.82.1459


 64%|██████▍   | 460/716 [01:42<00:31,  8.06it/s]

https://doi.org/10.1016/j.jnucmat.2016.03.017
https://doi.org/10.1016/j.jnucmat.2010.05.017


 65%|██████▍   | 464/716 [01:42<00:31,  8.05it/s]

https://doi.org/10.1081/fst-200039164
https://doi.org/10.1103/physrevb.85.245102
https://doi.org/10.1103/physrevb.31.5262


 65%|██████▌   | 466/716 [01:43<00:33,  7.56it/s]

https://doi.org/10.1088/0965-0393/25/1/014001
https://doi.org/10.1021/acs.jpcb.7b12358


 65%|██████▌   | 468/716 [01:43<00:29,  8.32it/s]

https://doi.org/none_23942303
https://doi.org/10.3390/app7111193


 66%|██████▌   | 470/716 [01:43<00:31,  7.87it/s]

https://doi.org/10.1103/physrevb.86.245203
https://doi.org/10.5194/acp-2017-1013


 66%|██████▌   | 471/716 [01:43<00:35,  6.93it/s]

https://doi.org/10.1007/s12274-012-0267-5
https://doi.org/10.1016/j.ijsolstr.2011.06.004


 66%|██████▋   | 475/716 [01:44<00:29,  8.11it/s]

https://doi.org/10.1038/srep03635
https://doi.org/10.1111/maps.12268
https://doi.org/10.1088/1361-651x/aaaf94


 67%|██████▋   | 477/716 [01:44<00:31,  7.50it/s]

https://doi.org/10.1038/s41598-017-18254-5
https://doi.org/10.1021/acsami.8b07925


 67%|██████▋   | 480/716 [01:44<00:26,  8.93it/s]

https://doi.org/10.1186/s11671-019-3123-7
https://doi.org/10.1080/01418619708207198
https://doi.org/10.11648/j.ijctc.20130103.11


 67%|██████▋   | 482/716 [01:45<00:25,  9.32it/s]

https://doi.org/10.1016/j.cpc.2006.06.003
https://doi.org/10.3390/lubricants4030024
https://doi.org/10.3390/molecules24061103


 68%|██████▊   | 484/716 [01:45<00:24,  9.57it/s]

https://doi.org/10.1088/0965-0393/17/2/025010
https://doi.org/10.1080/21663831.2018.1503198


 68%|██████▊   | 487/716 [01:45<00:29,  7.79it/s]

https://doi.org/10.1088/1361-648x/aaafb3
https://doi.org/10.1016/j.carbon.2016.02.080


 68%|██████▊   | 489/716 [01:46<00:29,  7.58it/s]

https://doi.org/10.1007/s10659-015-9568-8
https://doi.org/10.1016/j.ijsolstr.2009.07.006


 69%|██████▊   | 492/716 [01:46<00:25,  8.85it/s]

https://doi.org/10.1063/1.4922611
https://doi.org/none_19593622
https://doi.org/10.1145/2503210.2503235


 69%|██████▉   | 494/716 [01:46<00:27,  8.02it/s]

https://doi.org/10.1557/opl.2015.745
https://doi.org/10.1016/j.apcatb.2014.06.032


 69%|██████▉   | 497/716 [01:46<00:23,  9.18it/s]

https://doi.org/10.1016/j.compositesb.2016.04.012
https://doi.org/10.1088/0965-0393/12/4/007
https://doi.org/10.1021/acsomega.8b00707


 70%|██████▉   | 499/716 [01:47<00:26,  8.18it/s]

https://doi.org/10.1016/j.commatsci.2014.10.062
https://doi.org/10.1098/rsta.2009.0252


 70%|██████▉   | 501/716 [01:47<00:31,  6.79it/s]

https://doi.org/10.1016/j.commatsci.2014.12.001
https://doi.org/10.1016/j.mtla.2019.100416


 70%|███████   | 503/716 [01:47<00:35,  6.08it/s]

https://doi.org/10.1016/j.jmps.2016.08.007
https://doi.org/10.1007/s11671-008-9119-3


 71%|███████   | 506/716 [01:48<00:26,  7.93it/s]

https://doi.org/10.1038/srep13228
https://doi.org/10.1063/1.4997091
https://doi.org/10.1007/s00170-015-7051-0


 71%|███████   | 508/716 [01:48<00:28,  7.18it/s]

https://doi.org/10.1007/s10853-016-0700-3
https://doi.org/10.7494/csci.2013.14.1.27


 71%|███████   | 510/716 [01:48<00:33,  6.22it/s]

https://doi.org/10.3390/nano9020218
https://doi.org/10.1038/s41598-017-11139-7


 72%|███████▏  | 512/716 [01:49<00:34,  5.86it/s]

https://doi.org/10.1103/physrevmaterials.3.023804
https://doi.org/10.1021/jp505554w


 72%|███████▏  | 514/716 [01:49<00:36,  5.60it/s]

https://doi.org/10.5772/16823
https://doi.org/10.1186/s11671-018-2831-8


 72%|███████▏  | 517/716 [01:50<00:28,  6.93it/s]

https://doi.org/10.1007/s10853-018-3139-x
https://doi.org/10.1016/j.carbon.2014.05.061
https://doi.org/10.1016/j.commatsci.2014.11.047


 72%|███████▏  | 519/716 [01:50<00:24,  7.94it/s]

https://doi.org/10.1103/physrevx.9.031016
https://doi.org/none_21683541


 73%|███████▎  | 522/716 [01:50<00:23,  8.28it/s]

https://doi.org/none_27349239
https://doi.org/10.3390/nano8100856
https://doi.org/10.1021/jp404095x


 73%|███████▎  | 524/716 [01:50<00:21,  9.10it/s]

https://doi.org/10.1103/physrevb.37.3924
https://doi.org/10.1186/1556-276x-7-164
https://doi.org/10.1088/0953-8984/27/8/083001


 74%|███████▎  | 528/716 [01:51<00:21,  8.82it/s]

https://doi.org/10.17509/ijost.v2i2.7987
https://doi.org/none_9096290
https://doi.org/10.3390/e16010322


 74%|███████▍  | 530/716 [01:51<00:25,  7.27it/s]

https://doi.org/10.3390/biomimetics4010012
https://doi.org/10.1103/physrevb.78.054121


 74%|███████▍  | 532/716 [01:51<00:25,  7.31it/s]

https://doi.org/10.5772/17725
https://doi.org/10.1016/j.ijsolstr.2006.03.018


 75%|███████▍  | 535/716 [01:52<00:22,  7.90it/s]

https://doi.org/10.1557/mrc.2013.37
https://doi.org/10.3390/coatings7060083
https://doi.org/10.1038/s41598-018-22011-7


 75%|███████▌  | 538/716 [01:52<00:19,  8.92it/s]

https://doi.org/10.3390/c3040032
https://doi.org/10.1007/s11671-009-9268-z
https://doi.org/10.1016/j.mspro.2014.06.271


 75%|███████▌  | 540/716 [01:52<00:22,  7.96it/s]

https://doi.org/10.1038/s41467-019-10343-5
https://doi.org/10.1021/jp510951s


 76%|███████▌  | 542/716 [01:53<00:23,  7.25it/s]

https://doi.org/10.1016/j.commatsci.2016.11.006
https://doi.org/10.1155/2012/756791


 76%|███████▌  | 544/716 [01:53<00:23,  7.26it/s]

https://doi.org/10.1007/s10832-017-0093-y
https://doi.org/10.1016/j.commatsci.2018.10.021


 76%|███████▋  | 547/716 [01:53<00:19,  8.63it/s]

https://doi.org/10.1038/ncomms11816
https://doi.org/10.1016/j.intermet.2016.05.009
https://doi.org/10.1016/j.jcp.2015.10.009


 77%|███████▋  | 549/716 [01:53<00:18,  9.20it/s]

https://doi.org/10.1088/0965-0393/21/1/015009
https://doi.org/10.1038/s41598-019-42187-w
https://doi.org/10.1016/j.commatsci.2014.11.030


 77%|███████▋  | 552/716 [01:54<00:21,  7.68it/s]

https://doi.org/10.1021/acs.chemrev.5b00644
https://doi.org/10.1115/1.4038130


 77%|███████▋  | 554/716 [01:54<00:24,  6.62it/s]

https://doi.org/10.3390/nano8070546
https://doi.org/10.1177/1094342007085015


 78%|███████▊  | 557/716 [01:55<00:19,  8.13it/s]

https://doi.org/10.1098/rsta.2011.0208
https://doi.org/10.1016/j.commatsci.2019.02.024
https://doi.org/10.1016/j.ijheatmasstransfer.2019.01.074


 78%|███████▊  | 560/716 [01:55<00:17,  9.06it/s]

https://doi.org/10.1515/mesbi-2016-0007
https://doi.org/10.1016/j.wear.2012.02.010
https://doi.org/10.1103/physrevb.38.3318


 78%|███████▊  | 562/716 [01:55<00:19,  8.08it/s]

https://doi.org/10.1111/ffe.12189
https://doi.org/10.3390/cryst8050231


 79%|███████▉  | 564/716 [01:56<00:23,  6.49it/s]

https://doi.org/10.1186/1556-276x-8-312
https://doi.org/10.1038/ncomms4186


 79%|███████▉  | 566/716 [01:56<00:23,  6.43it/s]

https://doi.org/10.3390/a2010410
https://doi.org/10.1038/sdata.2017.57


 79%|███████▉  | 568/716 [01:56<00:23,  6.35it/s]

https://doi.org/10.1088/0960-1317/23/10/103001
https://doi.org/10.1007/s12274-009-9015-x


 79%|███████▉  | 569/716 [01:56<00:20,  7.03it/s]

https://doi.org/none_9108950
https://doi.org/10.1007/s00205-018-1284-7


 80%|████████  | 573/716 [01:57<00:16,  8.71it/s]

https://doi.org/10.5772/36394
https://doi.org/10.1103/physrevb.87.104114
https://doi.org/10.2172/1040790


 80%|████████  | 575/716 [01:57<00:17,  7.86it/s]

https://doi.org/10.1155/2010/742127
https://doi.org/10.1155/2017/8296458


 81%|████████  | 577/716 [01:57<00:19,  7.15it/s]

https://doi.org/10.1186/1556-276x-6-352
https://doi.org/10.1016/j.jmps.2019.07.018


 81%|████████  | 579/716 [01:58<00:22,  6.10it/s]

https://doi.org/10.1137/100806242
https://doi.org/10.1088/0965-0393/24/1/015002


 81%|████████  | 581/716 [01:58<00:23,  5.74it/s]

https://doi.org/10.5539/jmsr.v6n4p88
https://doi.org/10.1186/s11671-019-3116-6


 81%|████████▏ | 582/716 [01:58<00:23,  5.59it/s]

https://doi.org/10.1021/acs.langmuir.6b00934
https://doi.org/10.1046/j.1365-2818.1999.00452.x


 82%|████████▏ | 586/716 [01:59<00:17,  7.41it/s]

https://doi.org/10.1016/j.jallcom.2015.10.274
https://doi.org/10.1038/s41524-019-0181-4
https://doi.org/10.1117/12.840979


 82%|████████▏ | 589/716 [01:59<00:16,  7.92it/s]

https://doi.org/10.1021/acsnano.7b05815
https://doi.org/10.1103/physrevb.71.035211
https://doi.org/10.1007/s10704-017-0246-7


 83%|████████▎ | 591/716 [01:59<00:16,  7.66it/s]

https://doi.org/10.3390/min4020519
https://doi.org/10.1038/srep11290


 83%|████████▎ | 593/716 [02:00<00:17,  7.20it/s]

https://doi.org/none_21795708
https://doi.org/10.1073/pnas.1705723114


 83%|████████▎ | 595/716 [02:00<00:19,  6.32it/s]

https://doi.org/10.1016/s1359-6454(00)00002-1
https://doi.org/10.1103/physrevb.85.115206


 83%|████████▎ | 597/716 [02:00<00:20,  5.86it/s]

https://doi.org/10.1007/s00269-015-0762-9
https://doi.org/10.1016/j.cma.2015.06.001


 84%|████████▎ | 599/716 [02:01<00:20,  5.65it/s]

https://doi.org/10.1016/j.ijsolstr.2013.06.002
https://doi.org/10.1016/j.nimb.2017.09.012


 84%|████████▍ | 601/716 [02:01<00:18,  6.25it/s]

https://doi.org/10.1007/s00466-013-0927-7
https://doi.org/10.1021/acs.jpcc.5b01905


 84%|████████▍ | 602/716 [02:01<00:18,  6.06it/s]

https://doi.org/10.1073/pnas.1412962111


 84%|████████▍ | 604/716 [02:02<00:20,  5.48it/s]

https://doi.org/10.1103/physreve.82.016704
https://doi.org/10.1080/08927022.2012.671942


 85%|████████▍ | 606/716 [02:02<00:18,  5.84it/s]

https://doi.org/10.3390/met7030073
https://doi.org/10.2991/wartia-17.2017.66


 85%|████████▍ | 607/716 [02:02<00:19,  5.72it/s]

https://doi.org/10.5772/23794
https://doi.org/10.1088/1367-2630/9/9/325


 85%|████████▌ | 610/716 [02:03<00:17,  6.04it/s]

https://doi.org/10.1038/srep09084
https://doi.org/10.1016/s1359-6454(98)00038-x


 85%|████████▌ | 612/716 [02:03<00:15,  6.57it/s]

https://doi.org/10.5772/52592
https://doi.org/10.1016/j.nimb.2013.10.003


 86%|████████▌ | 614/716 [02:03<00:14,  6.89it/s]

https://doi.org/10.1038/srep11546
https://doi.org/10.1016/j.carbon.2010.06.004
https://doi.org/10.1021/acs.jctc.7b00092


 86%|████████▌ | 617/716 [02:04<00:14,  6.60it/s]

https://doi.org/10.1016/j.actamat.2018.03.055
https://doi.org/10.1103/physrevb.66.035205


 86%|████████▋ | 619/716 [02:04<00:13,  6.93it/s]

https://doi.org/10.1103/physrevb.81.235404
https://doi.org/10.1007/s00894-018-3829-y


 87%|████████▋ | 620/716 [02:04<00:14,  6.45it/s]

https://doi.org/10.1016/j.nimb.2010.11.017
https://doi.org/10.1016/j.actamat.2015.12.026


 87%|████████▋ | 622/716 [02:04<00:13,  6.83it/s]

https://doi.org/10.1016/j.jnoncrysol.2016.02.008
https://doi.org/none_21013761


 87%|████████▋ | 624/716 [02:05<00:12,  7.10it/s]

https://doi.org/10.1103/physrevlett.91.098301
https://doi.org/10.1088/0965-0393/21/3/035009


 88%|████████▊ | 627/716 [02:05<00:10,  8.17it/s]

https://doi.org/10.3329/jme.v40i2.5346
https://doi.org/10.1002/polb.24539


 88%|████████▊ | 629/716 [02:05<00:09,  8.72it/s]

https://doi.org/10.1016/j.jmps.2019.103731
https://doi.org/10.1073/pnas.1705978114


 88%|████████▊ | 631/716 [02:05<00:12,  6.81it/s]

https://doi.org/10.3390/met7120570
https://doi.org/10.1080/14786430902832773


 89%|████████▊ | 634/716 [02:06<00:10,  7.72it/s]

https://doi.org/10.1016/j.jmps.2013.04.008
https://doi.org/none_5285167
https://doi.org/10.1080/02670836.2016.1204064


 89%|████████▉ | 637/716 [02:06<00:08,  8.84it/s]

https://doi.org/10.1155/2011/252591
https://doi.org/10.3390/cryst8030116
https://doi.org/10.1038/s41467-018-03972-9


 89%|████████▉ | 639/716 [02:06<00:08,  9.41it/s]

https://doi.org/10.1051/esomat/200903008
https://doi.org/10.1016/j.jmps.2016.02.014
https://doi.org/10.1080/14786430903258184


 90%|████████▉ | 643/716 [02:07<00:07,  9.91it/s]

https://doi.org/10.1038/srep18892
https://doi.org/10.1529/biophysj.104.047332
https://doi.org/10.3390/cryst8080321


 90%|█████████ | 645/716 [02:07<00:07,  8.95it/s]

https://doi.org/10.1016/j.carbon.2014.09.031
https://doi.org/10.3390/ma10010088


 91%|█████████ | 648/716 [02:07<00:07,  8.74it/s]

https://doi.org/10.5772/36936
https://doi.org/10.1016/j.ijsolstr.2014.11.025
https://doi.org/10.1063/1.2124667


 91%|█████████ | 650/716 [02:08<00:07,  8.90it/s]

https://doi.org/10.1117/12.341254
https://doi.org/10.1098/rspa.2005.1567


 91%|█████████ | 653/716 [02:08<00:06,  9.48it/s]

https://doi.org/10.2481/dsj.007-051
https://doi.org/10.1038/srep40969
https://doi.org/10.1063/1.5086167


 91%|█████████▏| 655/716 [02:08<00:07,  8.32it/s]

https://doi.org/10.1016/j.jcp.2011.12.006
https://doi.org/10.1155/2016/8231592


 92%|█████████▏| 657/716 [02:09<00:08,  6.63it/s]

https://doi.org/10.1038/s41467-018-06166-5
https://doi.org/10.1103/physrevb.85.125204


 92%|█████████▏| 658/716 [02:09<00:07,  7.30it/s]

https://doi.org/10.1021/jp801931d


 92%|█████████▏| 660/716 [02:09<00:09,  5.86it/s]

https://doi.org/10.1016/j.jmps.2018.03.008
https://doi.org/10.1016/j.ijmecsci.2017.06.026


 92%|█████████▏| 662/716 [02:09<00:08,  6.47it/s]

https://doi.org/10.4208/cicp.oa-2017-0213
https://doi.org/10.1137/16m106978x


 93%|█████████▎| 664/716 [02:10<00:06,  7.60it/s]

https://doi.org/10.1016/j.actamat.2003.11.026
https://doi.org/10.1103/physrevb.37.6991


 93%|█████████▎| 666/716 [02:10<00:07,  7.11it/s]

https://doi.org/10.1016/j.ijsolstr.2011.06.022
https://doi.org/10.1038/s41467-018-07102-3


 93%|█████████▎| 668/716 [02:10<00:06,  7.06it/s]

https://doi.org/10.1007/s10853-016-0569-1
https://doi.org/10.1186/1556-276x-9-622


 94%|█████████▎| 670/716 [02:10<00:06,  7.08it/s]

https://doi.org/10.3897/rio.1.e7479
https://doi.org/10.1088/0034-4885/78/6/066501


 94%|█████████▍| 672/716 [02:11<00:05,  7.85it/s]

https://doi.org/10.1016/j.mssp.2016.05.003
https://doi.org/10.1016/j.jnucmat.2016.07.048


 94%|█████████▍| 674/716 [02:11<00:05,  7.37it/s]

https://doi.org/10.1103/physrevb.46.2250
https://doi.org/10.1126/sciadv.aat8195


 94%|█████████▍| 675/716 [02:11<00:06,  6.83it/s]

https://doi.org/10.1007/s10409-012-0124-5
https://doi.org/10.3390/cryst8020064


 95%|█████████▍| 678/716 [02:12<00:05,  6.59it/s]

https://doi.org/10.3390/polym10050475
https://doi.org/10.3390/min4020208


 95%|█████████▍| 680/716 [02:12<00:05,  6.84it/s]

https://doi.org/10.1088/1742-6596/905/1/012018
https://doi.org/10.1080/14686996.2017.1312519
https://doi.org/10.1021/acsomega.8b01767


 95%|█████████▌| 683/716 [02:12<00:04,  6.62it/s]

https://doi.org/10.1088/1361-6668/aafa88
https://doi.org/10.1038/ncomms10424


 96%|█████████▌| 686/716 [02:13<00:03,  7.56it/s]

https://doi.org/10.3390/cryst7080240
https://doi.org/10.1109/sc.2016.6
https://doi.org/10.1016/s1359-6454(99)00186-x


 96%|█████████▌| 687/716 [02:13<00:04,  7.10it/s]

https://doi.org/10.3390/met8020120
https://doi.org/10.1038/s41598-017-08455-3


 96%|█████████▋| 690/716 [02:13<00:03,  7.42it/s]

https://doi.org/10.1103/physrevb.73.024116
https://doi.org/10.1080/14786435.2018.1459059


 97%|█████████▋| 692/716 [02:14<00:03,  7.35it/s]

https://doi.org/10.1016/j.cocom.2018.e00330
https://doi.org/10.1039/c4cp03781b


 97%|█████████▋| 695/716 [02:14<00:03,  6.78it/s]

https://doi.org/10.1038/s41524-017-0031-1
https://doi.org/10.17632/wj2cy3kvy4.1
https://doi.org/10.1016/j.cma.2011.01.012


 97%|█████████▋| 698/716 [02:14<00:02,  8.30it/s]

https://doi.org/10.1016/j.cpc.2015.03.015
https://doi.org/10.1038/srep39708
https://doi.org/10.3389/fchem.2013.00006


 98%|█████████▊| 700/716 [02:15<00:02,  7.90it/s]

https://doi.org/10.1016/j.susc.2007.12.023
https://doi.org/10.1103/physrevb.65.224114
https://doi.org/10.1088/0953-8984/28/10/105002


 98%|█████████▊| 702/716 [02:15<00:01,  7.60it/s]

https://doi.org/10.1103/physrevmaterials.2.113403
https://doi.org/10.3390/catal8050192


 98%|█████████▊| 705/716 [02:15<00:01,  7.81it/s]

https://doi.org/none_26172483
https://doi.org/10.1002/nme.944


 99%|█████████▉| 708/716 [02:16<00:00,  8.01it/s]

https://doi.org/10.1038/s41598-017-10096-5
https://doi.org/10.18038/aubtda.405147
https://doi.org/10.2514/6.2007-5313


 99%|█████████▉| 710/716 [02:16<00:00,  6.80it/s]

https://doi.org/10.1016/s0370-1573(02)00633-6
https://doi.org/10.1080/00268970701730096


 99%|█████████▉| 712/716 [02:16<00:00,  7.93it/s]

https://doi.org/10.1016/j.surfcoat.2016.04.053
https://doi.org/none_24264187
https://doi.org/10.1007/s10659-010-9249-6


100%|█████████▉| 715/716 [02:17<00:00,  7.80it/s]

https://doi.org/10.1155/2013/641581
https://doi.org/10.5772/17892


100%|██████████| 716/716 [02:17<00:00,  5.22it/s]

https://doi.org/10.1016/j.commatsci.2013.04.014





In [23]:
len(graphs)

204

In [28]:
url = 'https://api.semanticscholar.org/graph/v1/paper/DOI:10.1016/j.commatsci.2013.04.014?fields=citations,references'

res = requests.get(url)
print(res.status_code)
print(res.json())

429
{'message': 'Too Many Requests'}


In [3]:
data

<Response [200]>

In [4]:
data.json()

{'paperId': '649def34f8be52c8b66281af98ae884c09aef38b',
 'citations': [{'paperId': 'b74aec118f2b62ae05b04f1b66ab79c2e5b873c0',
   'title': 'MRT: Tracing the Evolution of Scientific Publications'},
  {'paperId': '25b77db5bfca92029532ca70ee659fdf88db8484',
   'title': 'SMAuC - The Scientific Multi-Authorship Corpus'},
  {'paperId': '7e0fda71cc2e561385c0a2e29f5a81654a11157f',
   'title': 'VarMAE: Pre-training of Variational Masked Autoencoder for Domain-adaptive Language Understanding'},
  {'paperId': '4a236906f5bed6385c7b3bf3f10a0099e41d4566',
   'title': 'Semantic-Native Communication: A Simplicial Complex Perspective'},
  {'paperId': '97394fd6876dd10a0bdf233beb8216f16e074bee',
   'title': 'Visual Exploration of Literature with Argo Scholar'},
  {'paperId': '42b2fd8a0ab69281022de528c591c665f5f2ad3b',
   'title': 'A Multi-Domain Benchmark for Personalized Search Evaluation'},
  {'paperId': 'e92b2ada3a8112426946f3acd8991dbc74d4b311',
   'title': 'KnowledgeShovel: An AI-in-the-Loop Documen

In [8]:
import urllib.request
urllib.request.urlretrieve(data.json()['openAccessPdf']['url'], 'test.pdf')

HTTPError: HTTP Error 406: Not Acceptable

In [11]:
wget.download('https://export.arxiv.org/pdf/2009.12710.pdf', 'test.pdf')

'test (1).pdf'

In [36]:
workfolder = '/export/scratch/zeren/Papers2json/DeepCiteAll/'
filename = os.path.join(workfolder, 'openkim-model-citations/outputs/citing_papers.json')
citations = json.load(open(filename, 'r'))

citing_papers = {}
for cited_doi, c in citations.items():
    for citing_paper in c['citing_papers']:
        citing_doi = citing_paper['citing_doi']

        if citing_doi in citing_papers:
            citing_papers[citing_doi] += 1
        else:
            citing_papers[citing_doi] = 1
citing_papers.pop(None)

3488

In [33]:
publishers = [
    'acs',
    'aip',
    'iop',
    'rsc',
    'springer',
    'taylor_and_francis',
    'wiley',
    'unpaywall',
    'elsevier'
]

def get_doi_filename(publisher):
    return os.path.join(
        workfolder, 'deep-citation-additional-papers/inputs/{}/doi_to_shasum.txt'.format(publisher)
    )

def get_dois(publisher):
    doi_filename = get_doi_filename(publisher)

    with open(doi_filename, 'r') as f:
        doi_shasum_list = f.readlines()
    
    dois = []
    shasums = []
    for line in doi_shasum_list:
        dois.append(list(literal_eval(line).keys())[0])
        shasums.append(list(literal_eval(line).values())[0])
    return dois, shasums

Dois = []
Shasums = []
for p in publishers:
    dois, shasums = get_dois(p)

    Dois += dois
    Shasums += shasums
citing_doi_with_pdf = list(set(Dois))

In [37]:
citing_doi_wo_pdf = np.setdiff1d(list(citing_papers.keys()), citing_doi_with_pdf)

In [46]:
len(citing_doi_wo_pdf)

13340

In [61]:
hasOpenAccess = []
OpenAccessUrls = []
hasArxivAccess = []

for doi in tqdm(citing_doi_wo_pdf):
    url = 'https://api.semanticscholar.org/graph/v1/paper/DOI:{}?fields=isOpenAccess,openAccessPdf'.format(doi)

    data = requests.get(url)
    
    if data.status_code == 200:
        data = data.json()
        if data['isOpenAccess']:
            hasOpenAccess.append(doi)
            pdf_url = data['openAccessPdf']['url']
            OpenAccessUrls.append(pdf_url)
            if 'arxiv' in pdf_url:
                hasArxivAccess.append(doi)

100%|██████████| 13340/13340 [28:37<00:00,  7.77it/s] 


In [67]:
len(citing_papers), len()

28955

In [63]:
len(hasOpenAccess), len(hasArxivAccess)

(39, 7)

In [66]:
OpenAccessUrls

['http://www.homepages.ucl.ac.uk/~ucfbdxa/pubblicazioni/ijqc.pdf',
 'http://arxiv.org/pdf/cond-mat/0107195',
 'http://arxiv.org/pdf/cond-mat/0003232',
 'http://dspace.lib.cranfield.ac.uk/bitstream/1826/8722/1/Microsoft%20Word%20-%20oxide%20nanomaterials.pdf',
 'http://arxiv.org/pdf/1604.07959',
 'https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/9781119176817.ecm2107',
 'https://digital.csic.es/bitstream/10261/97383/1/Modeling%20the%20properties%20of%20carbon.pdf',
 'https://infoscience.epfl.ch/record/133949/files/paper_426.pdf',
 'http://arxiv.org/pdf/1211.5036',
 'https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/adem.202000207',
 'https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/adfm.201504085',
 'https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/adfm.202104250',
 'https://rss.onlinelibrary.wiley.com/doi/am-pdf/10.1002/adma.201603009',
 'http://arxiv.org/pdf/1805.06163',
 'https://rss.onlinelibrary.wiley.com/doi/am-pdf/10.1002/adma.201802306',
 'https://onlinelibrar

In [60]:
requests.get(url).status_code

404