In [1]:
from scholarly import scholarly

# Look up the author by name. The search result is consumed with next(),
# i.e. it is an iterator over matching author profiles.
author_name = "Maciej Piasecki"
search_query = scholarly.search_author(author_name)
# Keep only the first hit.
# NOTE(review): assumes the first hit is the intended person — check 'affiliation' in the output.
first_author_result = next(search_query)
first_author_result

{'container_type': 'Author',
 'filled': [],
 'source': <AuthorSource.SEARCH_AUTHOR_SNIPPETS: 'SEARCH_AUTHOR_SNIPPETS'>,
 'scholar_id': 'nU_W9XwAAAAJ',
 'url_picture': 'https://scholar.google.com/citations?view_op=medium_photo&user=nU_W9XwAAAAJ',
 'name': 'Maciej Piasecki',
 'affiliation': 'Wroclaw University of Science and Technology',
 'email_domain': '@pwr.wroc.pl',
 'interests': ['Computational Linguistics',
  'Natural Language Processing',
  'Human-Computer Interaction',
  'Artificial Intelligence',
  'Language Technology'],
 'citedby': 2951}

The `fill` method retrieves more information about the author.

In [2]:
# Fill the search snippet; the 'filled' list in the output names the sections that were fetched.
author = scholarly.fill(first_author_result)
author

{'container_type': 'Author',
 'filled': ['basics',
  'indices',
  'counts',
  'coauthors',
  'publications',
  'public_access'],
 'source': <AuthorSource.SEARCH_AUTHOR_SNIPPETS: 'SEARCH_AUTHOR_SNIPPETS'>,
 'scholar_id': 'nU_W9XwAAAAJ',
 'url_picture': 'https://scholar.google.com/citations?view_op=medium_photo&user=nU_W9XwAAAAJ',
 'name': 'Maciej Piasecki',
 'affiliation': 'Wroclaw University of Science and Technology',
 'email_domain': '@pwr.wroc.pl',
 'interests': ['Computational Linguistics',
  'Natural Language Processing',
  'Human-Computer Interaction',
  'Artificial Intelligence',
  'Language Technology'],
 'citedby': 2951,
 'citedby5y': 1328,
 'hindex': 24,
 'hindex5y': 14,
 'i10index': 81,
 'i10index5y': 28,
 'cites_per_year': {2006: 18,
  2007: 50,
  2008: 89,
  2009: 95,
  2010: 112,
  2011: 118,
  2012: 131,
  2013: 186,
  2014: 154,
  2015: 123,
  2016: 153,
  2017: 154,
  2018: 172,
  2019: 195,
  2020: 130,
  2021: 200,
  2022: 115,
  2023: 343,
  2024: 337},
 'coauthors'

Number of the author's publications:

In [3]:
# Count the publication entries attached to the filled author profile.
len(author['publications'])

293

Before filling, a publication entry contains only brief information (title, year, citation string, and citation count).

In [4]:
# Take the first publication entry; it is still unfilled at this point ('filled': False in the output).
first_publication = author['publications'][0]
first_publication

{'container_type': 'Publication',
 'source': <PublicationSource.AUTHOR_PUBLICATION_ENTRY: 'AUTHOR_PUBLICATION_ENTRY'>,
 'bib': {'title': 'ChatGPT: Jack of all trades, master of none',
  'pub_year': '2023',
  'citation': 'Information Fusion 99, 101861, 2023'},
 'filled': False,
 'author_pub_id': 'nU_W9XwAAAAJ:Aul-kAQHnToC',
 'num_citations': 427,
 'citedby_url': 'https://scholar.google.com/scholar?oi=bibs&hl=en&cites=2600515932282922845',
 'cites_id': ['2600515932282922845']}

In [5]:
# Fill the publication; the filled 'bib' gains fields such as 'author', 'journal' and 'abstract'.
first_publication_filled = scholarly.fill(first_publication)
first_publication_filled

{'container_type': 'Publication',
 'source': <PublicationSource.AUTHOR_PUBLICATION_ENTRY: 'AUTHOR_PUBLICATION_ENTRY'>,
 'bib': {'title': 'ChatGPT: Jack of all trades, master of none',
  'pub_year': 2023,
  'citation': 'Information Fusion 99, 101861, 2023',
  'author': 'Jan Kocoń and Igor Cichecki and Oliwier Kaszyca and Mateusz Kochanek and Dominika Szydło and Joanna Baran and Julita Bielaniewicz and Marcin Gruza and Arkadiusz Janz and Kamil Kanclerz and Anna Kocoń and Bartłomiej Koptyra and Wiktoria Mieleszczenko-Kowszewicz and Piotr Miłkowski and Marcin Oleksy and Maciej Piasecki and Łukasz Radliński and Konrad Wojtasik and Stanisław Woźniak and Przemysław Kazienko',
  'journal': 'Information Fusion',
  'volume': '99',
  'pages': '101861',
  'publisher': 'Elsevier',
  'abstract': 'OpenAI has released the Chat Generative Pre-trained Transformer (ChatGPT) and revolutionized the approach in artificial intelligence to human-model interaction. The first contact with the chatbot reveals it

Here we have multiple authors!

In [6]:
# All co-authors are returned as a single string, joined with " and ".
first_publication_filled['bib']['author']

'Jan Kocoń and Igor Cichecki and Oliwier Kaszyca and Mateusz Kochanek and Dominika Szydło and Joanna Baran and Julita Bielaniewicz and Marcin Gruza and Arkadiusz Janz and Kamil Kanclerz and Anna Kocoń and Bartłomiej Koptyra and Wiktoria Mieleszczenko-Kowszewicz and Piotr Miłkowski and Marcin Oleksy and Maciej Piasecki and Łukasz Radliński and Konrad Wojtasik and Stanisław Woźniak and Przemysław Kazienko'

The abstract is truncated: the returned text ends with an ellipsis.

In [7]:
# Show the abstract text of the filled publication (note the trailing ellipsis in the output).
first_publication_filled['bib']['abstract']

'OpenAI has released the Chat Generative Pre-trained Transformer (ChatGPT) and revolutionized the approach in artificial intelligence to human-model interaction. The first contact with the chatbot reveals its ability to provide detailed and precise answers in various areas. Several publications on ChatGPT evaluation test its effectiveness on well-known natural language processing (NLP) tasks. However, the existing studies are mostly non-automated and tested on a very limited scale. In this work, we examined ChatGPT’s capabilities on 25 diverse analytical NLP tasks, most of them subjective even to humans, such as sentiment analysis, emotion recognition, offensiveness, and stance detection. In contrast, the other tasks require more objective reasoning like word sense disambiguation, linguistic acceptability, and question answering. We also evaluated GPT-4 model on five selected subsets of NLP tasks. We …'

In [8]:
def get_author_publications(author_name):
    """Return the publication entries of the first author matching a name.

    Parameters
    ----------
    author_name : str
        Name passed to ``scholarly.search_author``.

    Returns
    -------
    list or None
        The ``'publications'`` value of the filled author profile, or ``None``
        when the search yields no author at all.

    Notes
    -----
    Only the first search hit is used and no affiliation check is performed.
    The expected 'affiliation' is 'Wroclaw University of Science and
    Technology' or similar, so verify the match for ambiguous names.
    """
    search_query = scholarly.search_author(author_name)
    if not search_query:
        return None
    # The search result is a lazy iterator, which is truthy even when it is
    # empty, so the check above cannot detect "no results". Ask next() for a
    # default instead of letting it raise StopIteration.
    first_author_result = next(iter(search_query), None)
    if first_author_result is None:
        return None
    author = scholarly.fill(first_author_result)
    return author['publications']

In [9]:
def structure_publications(publications):
    """Fill each publication and collect abstract, title and author.

    Parameters
    ----------
    publications : iterable
        Publication entries; each one is passed to ``scholarly.fill``.

    Returns
    -------
    list of dict
        One ``{'abstract', 'title', 'author'}`` dict per publication whose
        filled ``'bib'`` contains an ``'abstract'``. Publications without an
        abstract are skipped. ``'title'`` or ``'author'`` is ``None`` when the
        filled record lacks that field.
    """
    structured_publications = []
    for publication in publications:
        bib = scholarly.fill(publication)['bib']
        if 'abstract' not in bib:
            continue
        structured_publications.append({
            'abstract': bib['abstract'],
            # .get() so that one incomplete record does not abort the whole
            # loop with a KeyError.
            'title': bib.get('title'),
            'author': bib.get('author'),
        })

    return structured_publications

In [10]:
# Fetch the author's publication list, then fill every entry to collect abstract/title/author.
# NOTE(review): get_author_publications has a `return None` path, and structure_publications
# iterates its argument directly — confirm a None result cannot reach it.
mp_pubs = get_author_publications('Maciej Piasecki')
mp_structured_publications = structure_publications(mp_pubs)

In [11]:
# Inspect the first structured record (keys: 'abstract', 'title', 'author').
mp_structured_publications[0]

{'abstract': 'OpenAI has released the Chat Generative Pre-trained Transformer (ChatGPT) and revolutionized the approach in artificial intelligence to human-model interaction. The first contact with the chatbot reveals its ability to provide detailed and precise answers in various areas. Several publications on ChatGPT evaluation test its effectiveness on well-known natural language processing (NLP) tasks. However, the existing studies are mostly non-automated and tested on a very limited scale. In this work, we examined ChatGPT’s capabilities on 25 diverse analytical NLP tasks, most of them subjective even to humans, such as sentiment analysis, emotion recognition, offensiveness, and stance detection. In contrast, the other tasks require more objective reasoning like word sense disambiguation, linguistic acceptability, and question answering. We also evaluated GPT-4 model on five selected subsets of NLP tasks. We …',
 'title': 'ChatGPT: Jack of all trades, master of none',
 'author': '

In [23]:
from scholarly import ProxyGenerator

# Use a proxy to prevent the IP from being blocked.
pg = ProxyGenerator()
pg.FreeProxies()
scholarly.use_proxy(pg)

# Search authors by organization. This works for authors who have been added
# to the organization, so it does not include everyone.
# NOTE(review): despite its name, author_names holds full author result dicts, not just names.
organization_id = 6200813508511872715
author_names = list(scholarly.search_author_by_organization(organization_id))

In [24]:
# Number of author results returned by the organization search.
len(author_names)

508

In [29]:
# Each entry is an unfilled author search result ('filled': [] in the output).
author_names[0]

{'container_type': 'Author',
 'filled': [],
 'source': <AuthorSource.SEARCH_AUTHOR_SNIPPETS: 'SEARCH_AUTHOR_SNIPPETS'>,
 'scholar_id': 'hnzxVlgAAAAJ',
 'url_picture': 'https://scholar.google.com/citations?view_op=medium_photo&user=hnzxVlgAAAAJ',
 'name': 'Rafał Weron',
 'affiliation': 'Wrocław University of Science and Technology (Politechnika Wrocławska), Poland',
 'email_domain': '@pwr.edu.pl',
 'interests': ['Energy Forecasting',
  'Energy Analytics',
  'Energy Economics',
  'Computational Finance',
  'Energy Finance'],
 'citedby': 17276}

In [30]:
# Fill the first author result from the organization search.
author_filled = scholarly.fill(author_names[0])

Publications are sorted by citation count in descending order (most cited first), which is the default `sortby="citedby"` behaviour of `scholarly.fill`.

In [31]:
# Show the filled profile; compared with the search snippet it also carries 'organization' and 'homepage'.
author_filled

{'container_type': 'Author',
 'filled': ['basics',
  'indices',
  'counts',
  'coauthors',
  'publications',
  'public_access'],
 'source': <AuthorSource.SEARCH_AUTHOR_SNIPPETS: 'SEARCH_AUTHOR_SNIPPETS'>,
 'scholar_id': 'hnzxVlgAAAAJ',
 'url_picture': 'https://scholar.google.com/citations?view_op=medium_photo&user=hnzxVlgAAAAJ',
 'name': 'Rafał Weron',
 'affiliation': 'Wrocław University of Science and Technology (Politechnika Wrocławska), Poland',
 'email_domain': '@pwr.edu.pl',
 'interests': ['Energy Forecasting',
  'Energy Analytics',
  'Energy Economics',
  'Computational Finance',
  'Energy Finance'],
 'citedby': 17276,
 'organization': 6200813508511872715,
 'homepage': 'https://p.wz.pwr.edu.pl/~weron.rafal/',
 'citedby5y': 8402,
 'hindex': 62,
 'hindex5y': 45,
 'i10index': 133,
 'i10index5y': 95,
 'cites_per_year': {2002: 61,
  2003: 102,
  2004: 203,
  2005: 197,
  2006: 210,
  2007: 257,
  2008: 321,
  2009: 359,
  2010: 448,
  2011: 444,
  2012: 571,
  2013: 742,
  2014: 690,


In [32]:
# Fill the first publication of this author to get its detailed 'bib' record.
scholarly.fill(author_filled['publications'][0])

{'container_type': 'Publication',
 'source': <PublicationSource.AUTHOR_PUBLICATION_ENTRY: 'AUTHOR_PUBLICATION_ENTRY'>,
 'bib': {'title': 'Electricity price forecasting: A review of the state-of-the-art with a look into the future',
  'pub_year': 2014,
  'citation': 'International journal of forecasting 30 (4), 1030-1081, 2014',
  'author': 'Rafał Weron',
  'volume': '30',
  'number': '4',
  'pages': '1030-1081',
  'publisher': 'Elsevier',
  'abstract': 'A variety of methods and ideas have been tried for electricity price forecasting (EPF) over the last 15 years, with varying degrees of success. This review article aims to explain the complexity of available solutions, their strengths and weaknesses, and the opportunities and threats that the forecasting tools offer or that may be encountered. The paper also looks ahead and speculates on the directions EPF will or should take in the next decade or so. In particular, it postulates the need for objective comparative EPF studies involving 