# The Unconquerables of Open Access

## Importing Sherpa/Romeo data for MEDLINE journals

Project for the EAHIL conference 2023 : https://eahil2023.org/
Authors : **Floriane Muller & Pablo Iriarte**, University of Geneva  
Last update : 12.04.2023

The purpose of this notebook is to import the Sherpa/Romeo data for the PubMed journals list.

### Sources

* Export of NLM Journals currently indexed on MEDLINE

In [1]:
import json
import requests
import codecs
import pandas as pd
import time
import os



In [2]:
# Load the NLM journal list (tab-separated file, column names on the first line)
pubmed = pd.read_csv('data/sources/nlm/lsi2023.tsv', sep='\t', header=0)
pubmed

Unnamed: 0,NlmUniqueID,Title,MedlineTA,PublicationInfo/Country,PublicationInfo/Place,PublicationInfo/Publisher,PublicationInfo/PublicationFirstYear,PublicationInfo/PublicationEndYear,PublicationInfo/Frequency,"ISSN[@IssnType=""Electronic""]",...,ISSNLinking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN,Unnamed: 20
0,9875136,1199 news. National Union of Hospital and Heal...,1199 News,United States,New York,National Union of Hospital and Health Care Emp...,19uu,,"8 issues a year,",,...,0012-6535,eng,N,,N,N,H,,Y,
1,9015384,20 century British history,20 Century Br Hist,England,"Eynsham, Oxford",Oxford University Press,1990,,"4 no. a year,",1477-4674,...,0955-2359,eng,N,1990.0,Y,N,QIS,,Y,
2,101637720,A & A case reports,A A Case Rep,United States,"[New York, NY]",Wolters Kluwer Health / OvidSP,2013,2017,Biweekly,2325-7237,...,2325-7237,eng,N,,N,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y,
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,...,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y,
4,101269322,AACN advanced critical care,AACN Adv Crit Care,United States,"Aliso Viejo, CA",American Association of Critical-Care Nurses (...,2006,,Quarterly,1559-7776,...,1559-7768,eng,Y,2006.0,Y,Y,N,https://aacnjournals.org/aacnacconline,Y,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15425,0056272,Zuchthygiene,Zuchthygiene,Germany,Berlin,Verlag Paul Parey,1966,1989,Six no. a year,,...,0044-5371,ger,N,,N,N,J,,Y,
15426,21830020R,Zürcher medizingeschichtliche Abhandlungen,Zur Medizingesch Abh,Switzerland,Zurich,Juris Verlag,1924,,Irregular,,...,0514-4264,ger,N,,N,N,QIS,,Y,
15427,21830080R,Zvestí c̆erveného kríz̆a,Zvesti Cerv Kriza,Slovakia,[V Bratislava,,1940,19uu,,,...,,slo,N,,N,N,OM,,Y,
15428,0233767,ZWR,ZWR,Germany,Stuttgart,Thieme,1970,,Monthly,1439-9148,...,0044-166X,ger,N,,N,N,D,https://www.thieme-connect.de/products/ejourna...,Y,


In [3]:
# Remove the last column ('Unnamed: 20', a name pandas generates when the header has no
# label for a column). drop(..., errors='ignore') returns a new frame and tolerates a
# missing column, so this cell can be re-run without raising a KeyError.
pubmed = pubmed.drop(columns=['Unnamed: 20'], errors='ignore')
pubmed

Unnamed: 0,NlmUniqueID,Title,MedlineTA,PublicationInfo/Country,PublicationInfo/Place,PublicationInfo/Publisher,PublicationInfo/PublicationFirstYear,PublicationInfo/PublicationEndYear,PublicationInfo/Frequency,"ISSN[@IssnType=""Electronic""]","ISSN[@IssnType=""Print""]",ISSNLinking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN
0,9875136,1199 news. National Union of Hospital and Heal...,1199 News,United States,New York,National Union of Hospital and Health Care Emp...,19uu,,"8 issues a year,",,0012-6535,0012-6535,eng,N,,N,N,H,,Y
1,9015384,20 century British history,20 Century Br Hist,England,"Eynsham, Oxford",Oxford University Press,1990,,"4 no. a year,",1477-4674,0955-2359,0955-2359,eng,N,1990.0,Y,N,QIS,,Y
2,101637720,A & A case reports,A A Case Rep,United States,"[New York, NY]",Wolters Kluwer Health / OvidSP,2013,2017,Biweekly,2325-7237,,2325-7237,eng,N,,N,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
4,101269322,AACN advanced critical care,AACN Adv Crit Care,United States,"Aliso Viejo, CA",American Association of Critical-Care Nurses (...,2006,,Quarterly,1559-7776,1559-7768,1559-7768,eng,Y,2006.0,Y,Y,N,https://aacnjournals.org/aacnacconline,Y
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15425,0056272,Zuchthygiene,Zuchthygiene,Germany,Berlin,Verlag Paul Parey,1966,1989,Six no. a year,,0044-5371,0044-5371,ger,N,,N,N,J,,Y
15426,21830020R,Zürcher medizingeschichtliche Abhandlungen,Zur Medizingesch Abh,Switzerland,Zurich,Juris Verlag,1924,,Irregular,,0514-4264,0514-4264,ger,N,,N,N,QIS,,Y
15427,21830080R,Zvestí c̆erveného kríz̆a,Zvesti Cerv Kriza,Slovakia,[V Bratislava,,1940,19uu,,,,,slo,N,,N,N,OM,,Y
15428,0233767,ZWR,ZWR,Germany,Stuttgart,Thieme,1970,,Monthly,1439-9148,0044-166X,0044-166X,ger,N,,N,N,D,https://www.thieme-connect.de/products/ejourna...,Y


In [4]:
# Give the three ISSN columns short, uniform names
issn_column_names = {
    'ISSN[@IssnType="Electronic"]': 'ISSN-Electronic',
    'ISSN[@IssnType="Print"]': 'ISSN-Print',
    'ISSNLinking': 'ISSN-Linking',
}
pubmed = pubmed.rename(columns=issn_column_names)
pubmed

Unnamed: 0,NlmUniqueID,Title,MedlineTA,PublicationInfo/Country,PublicationInfo/Place,PublicationInfo/Publisher,PublicationInfo/PublicationFirstYear,PublicationInfo/PublicationEndYear,PublicationInfo/Frequency,ISSN-Electronic,ISSN-Print,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN
0,9875136,1199 news. National Union of Hospital and Heal...,1199 News,United States,New York,National Union of Hospital and Health Care Emp...,19uu,,"8 issues a year,",,0012-6535,0012-6535,eng,N,,N,N,H,,Y
1,9015384,20 century British history,20 Century Br Hist,England,"Eynsham, Oxford",Oxford University Press,1990,,"4 no. a year,",1477-4674,0955-2359,0955-2359,eng,N,1990.0,Y,N,QIS,,Y
2,101637720,A & A case reports,A A Case Rep,United States,"[New York, NY]",Wolters Kluwer Health / OvidSP,2013,2017,Biweekly,2325-7237,,2325-7237,eng,N,,N,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
4,101269322,AACN advanced critical care,AACN Adv Crit Care,United States,"Aliso Viejo, CA",American Association of Critical-Care Nurses (...,2006,,Quarterly,1559-7776,1559-7768,1559-7768,eng,Y,2006.0,Y,Y,N,https://aacnjournals.org/aacnacconline,Y
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15425,0056272,Zuchthygiene,Zuchthygiene,Germany,Berlin,Verlag Paul Parey,1966,1989,Six no. a year,,0044-5371,0044-5371,ger,N,,N,N,J,,Y
15426,21830020R,Zürcher medizingeschichtliche Abhandlungen,Zur Medizingesch Abh,Switzerland,Zurich,Juris Verlag,1924,,Irregular,,0514-4264,0514-4264,ger,N,,N,N,QIS,,Y
15427,21830080R,Zvestí c̆erveného kríz̆a,Zvesti Cerv Kriza,Slovakia,[V Bratislava,,1940,19uu,,,,,slo,N,,N,N,OM,,Y
15428,0233767,ZWR,ZWR,Germany,Stuttgart,Thieme,1970,,Monthly,1439-9148,0044-166X,0044-166X,ger,N,,N,N,D,https://www.thieme-connect.de/products/ejourna...,Y


In [5]:
# Strip the 'PublicationInfo/' prefix from the publication columns
publication_column_names = {
    'PublicationInfo/Country': 'Country',
    'PublicationInfo/Place': 'Place',
    'PublicationInfo/Publisher': 'Publisher',
    'PublicationInfo/PublicationFirstYear': 'PublicationFirstYear',
    'PublicationInfo/PublicationEndYear': 'PublicationEndYear',
    'PublicationInfo/Frequency': 'Frequency',
}
pubmed = pubmed.rename(publication_column_names, axis='columns')
pubmed

Unnamed: 0,NlmUniqueID,Title,MedlineTA,Country,Place,Publisher,PublicationFirstYear,PublicationEndYear,Frequency,ISSN-Electronic,ISSN-Print,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN
0,9875136,1199 news. National Union of Hospital and Heal...,1199 News,United States,New York,National Union of Hospital and Health Care Emp...,19uu,,"8 issues a year,",,0012-6535,0012-6535,eng,N,,N,N,H,,Y
1,9015384,20 century British history,20 Century Br Hist,England,"Eynsham, Oxford",Oxford University Press,1990,,"4 no. a year,",1477-4674,0955-2359,0955-2359,eng,N,1990.0,Y,N,QIS,,Y
2,101637720,A & A case reports,A A Case Rep,United States,"[New York, NY]",Wolters Kluwer Health / OvidSP,2013,2017,Biweekly,2325-7237,,2325-7237,eng,N,,N,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y
4,101269322,AACN advanced critical care,AACN Adv Crit Care,United States,"Aliso Viejo, CA",American Association of Critical-Care Nurses (...,2006,,Quarterly,1559-7776,1559-7768,1559-7768,eng,Y,2006.0,Y,Y,N,https://aacnjournals.org/aacnacconline,Y
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15425,0056272,Zuchthygiene,Zuchthygiene,Germany,Berlin,Verlag Paul Parey,1966,1989,Six no. a year,,0044-5371,0044-5371,ger,N,,N,N,J,,Y
15426,21830020R,Zürcher medizingeschichtliche Abhandlungen,Zur Medizingesch Abh,Switzerland,Zurich,Juris Verlag,1924,,Irregular,,0514-4264,0514-4264,ger,N,,N,N,QIS,,Y
15427,21830080R,Zvestí c̆erveného kríz̆a,Zvesti Cerv Kriza,Slovakia,[V Bratislava,,1940,19uu,,,,,slo,N,,N,N,OM,,Y
15428,0233767,ZWR,ZWR,Germany,Stuttgart,Thieme,1970,,Monthly,1439-9148,0044-166X,0044-166X,ger,N,,N,N,D,https://www.thieme-connect.de/products/ejourna...,Y


In [6]:
# Rows that have a linking ISSN, restricted to the three ISSN columns
has_linking_issn = pubmed['ISSN-Linking'].notna()
pubmed.loc[has_linking_issn, ['ISSN-Electronic', 'ISSN-Print', 'ISSN-Linking']]

Unnamed: 0,ISSN-Electronic,ISSN-Print,ISSN-Linking
0,,0012-6535,0012-6535
1,1477-4674,0955-2359,0955-2359
2,2325-7237,,2325-7237
3,2575-3126,,2575-3126
4,1559-7776,1559-7768,1559-7768
...,...,...,...
15423,1175-5334,1175-5326,1175-5326
15425,,0044-5371,0044-5371
15426,,0514-4264,0514-4264
15428,1439-9148,0044-166X,0044-166X


In [7]:
# Rows without an electronic ISSN but with a linking ISSN
linking_only = pubmed['ISSN-Electronic'].isna() & pubmed['ISSN-Linking'].notna()
pubmed.loc[linking_only, ['ISSN-Electronic', 'ISSN-Print', 'ISSN-Linking']]

Unnamed: 0,ISSN-Electronic,ISSN-Print,ISSN-Linking
0,,0012-6535,0012-6535
6,,1046-7467,1046-7467
7,,0160-6999,0160-6999
9,,0744-1479,0744-1479
11,,1054-5913,1054-5913
...,...,...,...
15417,,0044-5134,0044-5134
15418,,0289-0003,0289-0003
15422,,0044-5290,0044-5290
15425,,0044-5371,0044-5371


In [8]:
# Rows without an electronic ISSN but with a print ISSN
print_only = pubmed['ISSN-Electronic'].isna() & pubmed['ISSN-Print'].notna()
pubmed.loc[print_only, ['ISSN-Electronic', 'ISSN-Print', 'ISSN-Linking']]

Unnamed: 0,ISSN-Electronic,ISSN-Print,ISSN-Linking
0,,0012-6535,0012-6535
6,,1046-7467,1046-7467
7,,0160-6999,0160-6999
9,,0744-1479,0744-1479
11,,1054-5913,1054-5913
...,...,...,...
15418,,0289-0003,0289-0003
15421,,0514-4019,
15422,,0044-5290,0044-5290
15425,,0044-5371,0044-5371


In [9]:
# ISSN used for the Sherpa lookup, by order of preference:
# electronic ISSN, else linking ISSN, else print ISSN
pubmed['ISSN'] = (
    pubmed['ISSN-Electronic']
    .fillna(pubmed['ISSN-Linking'])
    .fillna(pubmed['ISSN-Print'])
)
# journals for which none of the three ISSNs is available
pubmed[pubmed['ISSN'].isna()]

Unnamed: 0,NlmUniqueID,Title,MedlineTA,Country,Place,Publisher,PublicationFirstYear,PublicationEndYear,Frequency,ISSN-Electronic,...,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN,ISSN
23,24320650R,Abstracts. International Congress on Tropical ...,Abstr Int Congr Trop Med Malar,United States,"Washington, D. C.",U. S. Govt. Print. Off.,1948,,,,...,,eng,N,,N,N,OM,,Y,
24,59930170R,Abstracts and translations from the science li...,Abstr Translat Sci Library,United States,Hartford.,,1932,1944,,,...,,eng,N,,N,N,OM,,Y,
37,14510510R,Accademia medica,Accad Medica,Italy,"[Torino, etc.]",,1930,19uu,,,...,,und,N,,N,N,OM,,Y,
44,0137764,ACRH [reports]. U.S. Atomic Energy Commission,ACRH Rep,United States,Chicago Il,Argonne Cancer Research Hospital,1954,19uu,,,...,,eng,N,,N,N,IM,,Y,
71,14520280R,Acta argentina de fisiología y fisiopatología,Acta Argent Fisiol Fisiopatol,Argentina,[Córdoba],Univ. Nacional de Córdoba.,1950,1954,,,...,,spa,N,,N,N,OM,,Y,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15408,21820320R,De Ziekenfondsgids,Ziekenfondsgids,Netherlands,[Utrecht?],,1947,19uu,,,...,,dut,N,,N,N,OM,,Y,
15409,0035477,Het Ziekenhuiswezen,Ziekenhuiswezen,Netherlands,Lochem [Nederland],,1928,1970,,,...,,dut,N,,N,N,OM,,Y,
15411,9878612,Zimbabwe Rhodesia Nurse,Zimbabwe Rhod Nurse,Zimbabwe,Salisbury,Zimbabwe Rhodesia Nurses Association,1979,1979,Annual,,...,,eng,N,,N,N,N,,Y,
15424,21820450R,Zubolekarski pregled,Zubolekarski Pregl,Bulgaria,,,1911,1950,,,...,,bul,N,,N,N,OM,,Y,


In [10]:
# Split the currently indexed journals according to whether an ISSN is available
currently_indexed = pubmed['CurrentlyIndexedYN'].eq('Y')
has_issn = pubmed['ISSN'].notna()
pubmed_medline_issn = pubmed[currently_indexed & has_issn]
pubmed_medline_not_issn = pubmed[currently_indexed & ~has_issn]
pubmed_medline_issn

Unnamed: 0,NlmUniqueID,Title,MedlineTA,Country,Place,Publisher,PublicationFirstYear,PublicationEndYear,Frequency,ISSN-Electronic,...,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN,ISSN
1,9015384,20 century British history,20 Century Br Hist,England,"Eynsham, Oxford",Oxford University Press,1990,,"4 no. a year,",1477-4674,...,0955-2359,eng,N,1990.0,Y,N,QIS,,Y,1477-4674
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,...,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y,2575-3126
4,101269322,AACN advanced critical care,AACN Adv Crit Care,United States,"Aliso Viejo, CA",American Association of Critical-Care Nurses (...,2006,,Quarterly,1559-7776,...,1559-7768,eng,Y,2006.0,Y,Y,N,https://aacnjournals.org/aacnacconline,Y,1559-7776
8,0431420,AANA journal,AANA J,United States,"Park Ridge, Ill.",American Association of Nurse Anesthetists,1974,,Bimonthly,2162-5239,...,0094-6354,eng,N,1974.0,Y,Y,N,https://www.aana.com/publications/aana-journal,Y,2162-5239
12,101223209,The AAPS journal,AAPS J,United States,"Arlington, Va., USA",American Association of Pharmaceutical Scientists,2004,,Four no. a year,1550-7416,...,1550-7416,eng,Y,2004.0,Y,Y,IM,https://link.springer.com/journal/12248,Y,1550-7416
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15418,8702287,Zoological science,Zoolog Sci,Japan,"Tokyo, Japan",Zoological Society of Japan,1984,,"Monthly,",,...,0289-0003,eng,N,2002.0,Y,Y,IM,http://www.bioone.org/loi/jzoo,Y,0289-0003
15419,9435608,"Zoology (Jena, Germany)",Zoology (Jena),Germany,"Jena, Germany",Urban & Fischer,1994,,"Six no. a year,",1873-2720,...,0944-2006,eng,N,2005.0,Y,Y,IM,https://www.sciencedirect.com/journal/zoology,Y,1873-2720
15420,101300786,Zoonoses and public health,Zoonoses Public Health,Germany,"Berlin, Germany",Blackwell Verlag,2007,,Ten no. a year,1863-2378,...,1863-1959,eng,Y,2007.0,Y,Y,IM,http://onlinelibrary.wiley.com/journal/10.1111...,Y,1863-2378
15423,101179386,Zootaxa,Zootaxa,New Zealand,"Auckland, N.Z.",Magnolia Press,2001,,Irregular,1175-5334,...,1175-5326,eng,N,2013.0,Y,Y,IM,http://www.mapress.com/j/zt/,Y,1175-5334


In [11]:
# Currently indexed journals whose ISSN column is empty
pubmed_medline_not_issn

Unnamed: 0,NlmUniqueID,Title,MedlineTA,Country,Place,Publisher,PublicationFirstYear,PublicationEndYear,Frequency,ISSN-Electronic,...,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN,ISSN
11647,9918487341206676,Physical therapy & rehabilitation journal,Phys Ther Rehabil J,England,"[Oxford, United Kingdom]",Oxford University Press,2021,,Monthly,,...,,eng,Y,2021.0,Y,Y,IM,https://academic.oup.com/ptj,Y,


In [12]:
# download sherpa data: one JSON file per ISSN, failures are appended to an error log

# The API key is read from the environment so that it is not stored in the notebook
sherpa_api_key = os.environ.get('SHERPA_API_KEY')
if not sherpa_api_key:
    raise RuntimeError('Set the SHERPA_API_KEY environment variable before running this cell')

sherpa_url = 'https://v2.sherpa.ac.uk/cgi/retrieve_by_id'
sherpa_data_dir = 'data/sources/sherpa/data_2023/'
sherpa_errors_file = 'data/sources/sherpa/errors_2023/errors.txt'
# make sure the output folders exist before the (long) loop starts
os.makedirs(sherpa_data_dir, exist_ok=True)
os.makedirs(os.path.dirname(sherpa_errors_file), exist_ok=True)

issns_import = pubmed_medline_issn
for index, row in issns_import.iterrows():
    myissn = row['ISSN']
    query = {
        'item-type': 'publication',
        'api-key': sherpa_api_key,
        'format': 'Json',
        'identifier': myissn,
    }
    headers = {'Accept': 'application/json'}
    record = None
    status = ''
    try:
        # the timeout prevents a stalled connection from blocking the loop forever
        resp = requests.get(sherpa_url, params=query, headers=headers, timeout=60)
        status = str(resp.status_code)
        # check the status code and decode the body BEFORE opening the output file,
        # so that an invalid response never leaves an empty or partial .json file
        if resp.status_code == 200:
            record = resp.json()
    except (requests.RequestException, ValueError) as exc:
        # network failure or invalid JSON: log it and carry on with the next ISSN
        status = (status + ' ' + type(exc).__name__).strip()
    if record is not None:
        # export as JSON
        with open(sherpa_data_dir + myissn + '.json', 'w', encoding='utf-8') as f:
            json.dump(record, f, ensure_ascii=False, indent=4)
    else:
        with open(sherpa_errors_file, 'a', encoding='utf-8') as g:
            g.write(myissn + ' - ' + status + '\n')
    # progress indicator: print the row label when it is a multiple of 100
    if index % 100 == 0:
        print(index)
    # wait one second between requests to avoid overloading the API
    time.sleep(1)

300
500
900
1100
1200
1400
1700
1800
1900
2200
2300
2700
3200
3800
3900
4200
4600
4700
5100
5300
5400
5800
6000
6200
6300
6400
6500
6700
6900
7000
7300
7500
7600
7700
7800
7900
8000
8400
8500
8900
9100
9200
9400
10000
10400
10600
11100
11700
12000
12200
12500
13400
13500
13700
14300
14400
15300
15400


In [13]:
# selected journals that have no print ISSN
missing_print_issn = pubmed_medline_issn['ISSN-Print'].isna()
pubmed_medline_issn[missing_print_issn]

Unnamed: 0,NlmUniqueID,Title,MedlineTA,Country,Place,Publisher,PublicationFirstYear,PublicationEndYear,Frequency,ISSN-Electronic,...,ISSN-Linking,Language,TitleContinuationYN,IndexingStartDate,CurrentlyIndexedYN,IndexOnlineYN,IndexingSubset,IndexingSelectedURL,ReportedMedlineYN,ISSN
3,101714112,A&A practice,A A Pract,United States,"[Philadelphia, PA]","Wolters Kluwer Health, Inc.",2018,,Biweekly,2575-3126,...,2575-3126,eng,Y,2018.0,Y,Y,IM,https://ovidsp.ovid.com/ovidweb.cgi?T=JS&MODE=...,Y,2575-3126
12,101223209,The AAPS journal,AAPS J,United States,"Arlington, Va., USA",American Association of Pharmaceutical Scientists,2004,,Four no. a year,1550-7416,...,1550-7416,eng,Y,2004.0,Y,Y,IM,https://link.springer.com/journal/12248,Y,1550-7416
14,100960111,AAPS PharmSciTech,AAPS PharmSciTech,United States,New York,Springer,2000,,Quarterly,1530-9932,...,1530-9932,eng,N,2000.0,Y,Y,IM,https://link.springer.com/journal/12249,Y,1530-9932
46,101729147,ACS applied bio materials,ACS Appl Bio Mater,United States,"Washington, DC",ACS Publications,2018,,Monthly,2576-6422,...,2576-6422,eng,N,2021.0,Y,Y,IM,https://pubs.acs.org/journal/aabmcb,Y,2576-6422
48,101654670,ACS biomaterials science & engineering,ACS Biomater Sci Eng,United States,"Washington, DC",American Chemical Society,2015,,Monthly,2373-9878,...,2373-9878,eng,N,2020.0,Y,Y,IM,https://pubs.acs.org/journal/abseba,Y,2373-9878
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
14874,101231645,Virology journal,Virol J,England,[London],BioMed Central,2004,,,1743-422X,...,1743-422X,eng,N,2004.0,Y,Y,IM,http://www.virologyj.com/,Y,1743-422X
14886,101509722,Viruses,Viruses,Switzerland,"Basel, Switzerland",MDPI,2009,,Quarterly,1999-4915,...,1999-4915,eng,N,2011.0,Y,Y,IM,http://www.mdpi.com/journal/viruses,Y,1999-4915
15048,9918227353306676,WIREs mechanisms of disease,WIREs Mech Dis,United States,"[Hoboken, NJ]","John Wiley & Sons, Inc.",2021,,Bimonthly,2692-9368,...,2692-9368,eng,Y,2021.0,Y,Y,IM,https://wires.onlinelibrary.wiley.com/journal/...,Y,2692-9368
15088,101266603,World journal of emergency surgery : WJES,World J Emerg Surg,England,London,BioMed Central,2006,,,1749-7922,...,1749-7922,eng,N,2017.0,Y,Y,IM,http://www.wjes.org/,Y,1749-7922


In [14]:
# download sherpa data for p-ISSN (in case of error in NLM data)
# Only print ISSNs that have no JSON file yet are requested.

# The API key is read from the environment so that it is not stored in the notebook
sherpa_api_key = os.environ.get('SHERPA_API_KEY')
if not sherpa_api_key:
    raise RuntimeError('Set the SHERPA_API_KEY environment variable before running this cell')

sherpa_url = 'https://v2.sherpa.ac.uk/cgi/retrieve_by_id'
sherpa_data_dir = 'data/sources/sherpa/data_2023/'
sherpa_errors_file = 'data/sources/sherpa/errors_2023/errors_print.txt'
# make sure the output folders exist before the (long) loop starts
os.makedirs(sherpa_data_dir, exist_ok=True)
os.makedirs(os.path.dirname(sherpa_errors_file), exist_ok=True)

issns_import = pubmed_medline_issn.loc[pubmed_medline_issn['ISSN-Print'].notna()]
for index, row in issns_import.iterrows():
    myissn = row['ISSN-Print']
    # skip the ISSNs whose file already exists instead of downloading them again
    if os.path.exists(sherpa_data_dir + myissn + '.json'):
        continue
    query = {
        'item-type': 'publication',
        'api-key': sherpa_api_key,
        'format': 'Json',
        'identifier': myissn,
    }
    headers = {'Accept': 'application/json'}
    record = None
    status = ''
    try:
        # the timeout prevents a stalled connection from blocking the loop forever
        resp = requests.get(sherpa_url, params=query, headers=headers, timeout=60)
        status = str(resp.status_code)
        # check the status code and decode the body BEFORE opening the output file:
        # a partial file would otherwise be treated as "already downloaded" on the next run
        if resp.status_code == 200:
            record = resp.json()
    except (requests.RequestException, ValueError) as exc:
        # network failure or invalid JSON: log it and carry on with the next ISSN
        status = (status + ' ' + type(exc).__name__).strip()
    if record is not None:
        # export as JSON
        with open(sherpa_data_dir + myissn + '.json', 'w', encoding='utf-8') as f:
            json.dump(record, f, ensure_ascii=False, indent=4)
    else:
        with open(sherpa_errors_file, 'a', encoding='utf-8') as g:
            g.write(myissn + ' - ' + status + '\n')
    # progress indicator: print the row label when it is a multiple of 100
    if index % 100 == 0:
        print(index)
    # wait one second between requests to avoid overloading the API
    time.sleep(1)

300
500
900
1100
1400
1700
1800
1900
2200
2300
2700
3200
3800
3900
4200
4600
4700
5100
5300
5400
5800
6000
6200
6300
6500
6700
6900
7300
7500
7600
7700
7800
7900
8000
8400
8500
8900
9100
9200
9400
10000
10400
10600
11100
11700
12000
12200
12500
13500
13700
14300
14400
15300


In [15]:
# Save the selected journals (with their ISSN column) as TSV and as Excel, without the index
pubmed_medline_issn.to_csv(
    path_or_buf='data/sources/nlm/lsi2023_medline_issns.tsv',
    index=False,
    sep='\t',
    encoding='utf-8',
)
pubmed_medline_issn.to_excel(
    excel_writer='data/sources/nlm/lsi2023_medline_issns.xlsx',
    index=False,
)