## Notebook to test OpenAlex
#### An open and comprehensive catalog of scholarly papers, authors, and institutions.

In [1]:
# install necessary packages
!pip install pyalex



In [3]:
# import packages
from pyalex import Works, Authors, Sources, Institutions, Concepts, Publishers, Funders
import polars as pl

In [4]:
# Configure how polars prints dataframes so more text is visible in the output
pl.Config.set_ascii_tables()  # draw table borders with plain ASCII characters
pl.Config.set_tbl_width_chars(128)  # allow printed tables to be up to 128 characters wide
# Show up to 64 characters of each string value; as the last expression of the
# cell, this call's return value is what gets echoed as the cell output.
pl.Config.set_fmt_str_lengths(64)

polars.config.Config

In [6]:
# Fetch one random source record from OpenAlex (returned as a single dict)
Sources().random()

{'id': 'https://openalex.org/S63040059',
 'issn_l': '1551-7144',
 'issn': ['1551-7144', '1559-2030'],
 'display_name': 'Contemporary Clinical Trials',
 'host_organization': 'https://openalex.org/P4310320990',
 'host_organization_name': 'Elsevier BV',
 'host_organization_lineage': ['https://openalex.org/P4310320990'],
 'works_count': 3116,
 'cited_by_count': 50118,
 'summary_stats': {'2yr_mean_citedness': 2.2018518518518517,
  'h_index': 77,
  'i10_index': 1338},
 'is_oa': False,
 'is_in_doaj': False,
 'ids': {'openalex': 'https://openalex.org/S63040059',
  'issn_l': '1551-7144',
  'issn': ['1551-7144', '1559-2030'],
  'mag': '63040059',
  'wikidata': 'https://www.wikidata.org/entity/Q5164971'},
 'homepage_url': 'https://www.journals.elsevier.com/contemporary-clinical-trials',
 'apc_prices': None,
 'apc_usd': None,
 'country_code': 'US',
 'societies': [],
 'alternate_titles': ['Contemp clin trials 4'],
 'abbreviated_title': None,
 'type': 'journal',
 'x_concepts': [{'id': 'https://opena

In [7]:
# Fetch works whose publication_year is 2023, requesting only the fields listed
# (each field is named once)
works = pl.DataFrame(
    Works()
    .filter(publication_year=2023)
    .select(["id", "title", "display_name", "publication_date", "doi"])
    .get()
)

# Sort the works by publication date, newest first. The sorted frame is the
# cell's displayed output; `works` itself is not reassigned.
works.sort(by="publication_date", descending=True)

id,title,display_name,publication_date,doi
str,str,str,str,str
"""https://openalex.org/W4291783855""","""Dematiaceous Hyphomycetes""","""Dematiaceous Hyphomycetes""","""2023-07-01""","""https://doi.org/10.1079/9780851986180.0000"""
"""https://openalex.org/W4362597599""","""Journal of Lightwave Technology""","""Journal of Lightwave Technology""","""2023-06-19""","""https://doi.org/10.1109/jlt.50"""
"""https://openalex.org/W4212930147""","""IEEE Journal of Selected Topics in Quantum Electronics""","""IEEE Journal of Selected Topics in Quantum Electronics""","""2023-06-13""","""https://doi.org/10.1109/jstqe.2944"""
"""https://openalex.org/W2081899208""","""Flatland: A Romance of Many Dimensions""","""Flatland: A Romance of Many Dimensions""","""2023-05-23""","""https://doi.org/10.4324/9781003056355-4"""
"""https://openalex.org/W1541215049""","""An Introduction to Visual Culture""","""An Introduction to Visual Culture""","""2023-05-02""","""https://doi.org/10.4324/9780429280238"""
"""https://openalex.org/W4200178834""","""International Journal of Pharmaceutical Sciences and Research""","""International Journal of Pharmaceutical Sciences and Research""","""2023-05-02""","""https://doi.org/10.13040/ijpsr.0975-8232"""
"""https://openalex.org/W304830213""","""The Reproduction of Mothering""","""The Reproduction of Mothering""","""2023-04-28""","""https://doi.org/10.2307/jj.2373318"""
"""https://openalex.org/W170545881""","""Patients and Healers in the Context of Culture""","""Patients and Healers in the Context of Culture""","""2023-04-28""","""https://doi.org/10.2307/jj.2711689"""
"""https://openalex.org/W2059517889""","""Toward a Rational Society""","""Toward a Rational Society""","""2023-04-28""","""https://doi.org/10.4324/9781003320609-36"""
"""https://openalex.org/W3108524584""","""Language As Symbolic Action""","""Language As Symbolic Action""","""2023-04-28""","""https://doi.org/10.2307/jj.2711556"""


In [9]:
# Get a list of publishers from OpenAlex
# NOTE(review): the printed output of this cell has 25 names, so this is
# presumably one page of results rather than every publisher — confirm.
pubs = Publishers().get()

def extract_item(list_of_dicts, key):
    """Collect the value stored under ``key`` from every dictionary that has it.

    Args:
        list_of_dicts: Iterable of dictionaries to scan.
        key: The key to look up in each dictionary.

    Returns:
        A list of the matching values, in input order. Dictionaries that do
        not contain ``key`` are skipped.
    """
    return [entry[key] for entry in list_of_dicts if key in entry]

# Pull the 'display_name' of each publisher record that has one, then print the list
result = extract_item(pubs, 'display_name')
print(result)

['Elsevier BV', 'Springer Nature', 'Wiley', 'Springer Science+Business Media', 'Wiley-Blackwell', 'Taylor & Francis', 'University of Oxford', 'Oxford University Press', 'SAGE Publishing', 'Wolters Kluwer', 'Lippincott Williams & Wilkins', 'University of Cambridge', 'Cambridge University Press', 'American Chemical Society', 'Institute of Electrical and Electronics Engineers', 'Nature Portfolio', 'Institute of Physics', 'IOP Publishing', 'MDPI', 'BMJ', 'American Institute of Physics', 'De Gruyter', 'Thieme Medical Publishers (Germany)', 'Royal Society of Chemistry', 'American Physical Society']


In [12]:
# Fetch a single work by its OpenAlex ID
Works()["W4313531093"]


{'id': 'https://openalex.org/W4313531093',
 'doi': 'https://doi.org/10.1016/j.cell.2022.11.001',
 'title': 'Hallmarks of aging: An expanding universe',
 'display_name': 'Hallmarks of aging: An expanding universe',
 'publication_year': 2023,
 'publication_date': '2023-01-01',
 'ids': {'openalex': 'https://openalex.org/W4313531093',
  'doi': 'https://doi.org/10.1016/j.cell.2022.11.001',
  'pmid': 'https://pubmed.ncbi.nlm.nih.gov/36599349'},
 'language': 'en',
 'primary_location': {'is_oa': False,
  'landing_page_url': 'https://doi.org/10.1016/j.cell.2022.11.001',
  'pdf_url': None,
  'source': {'id': 'https://openalex.org/S110447773',
   'display_name': 'Cell',
   'issn_l': '0092-8674',
   'issn': ['0092-8674', '1097-4172'],
   'is_oa': False,
   'is_in_doaj': False,
   'host_organization': 'https://openalex.org/P4310315673',
   'host_organization_name': 'Cell Press',
   'host_organization_lineage': ['https://openalex.org/P4310320990',
    'https://openalex.org/P4310315673'],
   'host_or