# Sample code for interacting with the Scholarly toolbox


## If Scholarly is not installed, first install it from GitHub

In [None]:
# Make sure the `scholarly` package is importable; if it is not, install the
# latest version straight from GitHub. Equivalent shell command:
#   pip3 install -U git+https://github.com/scholarly-python-package/scholarly.git

# Import the submodule explicitly: a bare `import importlib` does not
# guarantee that `importlib.util` is available as an attribute.
import importlib.util
import subprocess
import sys

scholarly_spec = importlib.util.find_spec('scholarly')
found = scholarly_spec is not None
if not found:
    # `pip.main` is not a supported API (it was moved to an internal module in
    # pip 10). Running pip as a subprocess of the current interpreter is the
    # supported route and installs into the environment this kernel uses.
    subprocess.check_call([
        sys.executable, '-m', 'pip', 'install', '-U',
        'git+https://github.com/scholarly-python-package/scholarly.git',
    ])
    # Let the import system notice the freshly installed package.
    importlib.invalidate_caches()

from scholarly import scholarly
import pandas as pd

## Experiment with Scholarly

In [34]:
from scholarly import scholarly
import pandas as pd

dataset = "ds003374"  # dataset to search for
# `search_pubs` returns an iterator over the matching publications; the cells
# below read its `total_results` attribute and loop over it.
search_query = scholarly.search_pubs(dataset)

In [36]:
# Show the `total_results` attribute of the search iterator (the saved output below is 4).
search_query.total_results

4

In [35]:
# Fill every search hit with its complete record, print it, and keep it in
# `pub_list` so the filled records remain available after the search iterator
# has been consumed.
pub_list = []
for s in search_query:
    filled = scholarly.fill(s)
    pub_list.append(filled)
    print(filled)

{'container_type': 'Publication', 'source': <PublicationSource.PUBLICATION_SEARCH_SNIPPET: 'PUBLICATION_SEARCH_SNIPPET'>, 'bib': {'title': 'Dataset of spiking and LFP activity invasively recorded in the human amygdala during aversive dynamic stimuli', 'author': 'Fedele, Tommaso and Boran, Ece and Chirkov, Valerii and Hilfiker, Peter and Grunwald, Thomas and Stieglitz, Lennart and Jokeit, Hennric and Sarnthein, Johannes', 'pub_year': '2021', 'venue': 'Scientific data', 'abstract': 'We present an electrophysiological dataset collected from the amygdalae of nine participants  attending a visual dynamic stimulation of emotional aversive content. The participants', 'publisher': 'Nature Publishing Group UK London', 'pages': '9', 'number': '1', 'volume': '8', 'journal': 'Scientific data', 'pub_type': 'article', 'bib_id': 'fedele2021dataset'}, 'filled': True, 'gsrank': 1, 'pub_url': 'https://www.nature.com/articles/s41597-020-00790-x', 'author_id': ['', '', 'XRumrPwAAAAJ', '', ''], 'url_schola

In [22]:
# No cell in this notebook defines `pub`, so on a fresh kernel this cell would
# fail with NameError. Take the top-ranked hit of a new search for `dataset`
# (consistent with the saved output below, which shows 'gsrank': 1) and fill it.
pub = next(scholarly.search_pubs(dataset))
filled_pub = scholarly.fill(pub, sections=['venue'])

In [23]:
# Display the filled publication record.
filled_pub

{'container_type': 'Publication',
 'source': <PublicationSource.PUBLICATION_SEARCH_SNIPPET: 'PUBLICATION_SEARCH_SNIPPET'>,
 'bib': {'title': 'Dataset of spiking and LFP activity invasively recorded in the human amygdala during aversive dynamic stimuli',
  'author': 'Fedele, Tommaso and Boran, Ece and Chirkov, Valerii and Hilfiker, Peter and Grunwald, Thomas and Stieglitz, Lennart and Jokeit, Hennric and Sarnthein, Johannes',
  'pub_year': '2021',
  'venue': 'Scientific data',
  'abstract': 'We present an electrophysiological dataset collected from the amygdalae of nine participants  attending a visual dynamic stimulation of emotional aversive content. The participants',
  'publisher': 'Nature Publishing Group UK London',
  'pages': '9',
  'number': '1',
  'volume': '8',
  'journal': 'Scientific data',
  'pub_type': 'article',
  'bib_id': 'fedele2021dataset'},
 'filled': True,
 'gsrank': 1,
 'pub_url': 'https://www.nature.com/articles/s41597-020-00790-x',
 'author_id': ['', '', 'XRumrPw

In [1]:
from scholarly import scholarly
from scholarly import ProxyGenerator
import os

# The ScraperAPI key is a PAID key specific to the NEMAR project. It must never
# be committed to the notebook: read it from the environment instead.
# NOTE(review): the key that was previously hardcoded here should be treated as
# leaked and rotated.
scraper_api_key = os.environ.get("SCRAPER_API_KEY")
if not scraper_api_key:
    raise RuntimeError(
        "Set the SCRAPER_API_KEY environment variable to the ScraperAPI key "
        "before running this cell."
    )

pg = ProxyGenerator()
success = pg.ScraperAPI(scraper_api_key)
if success:
    # Creating the generator is not enough: scholarly only routes its requests
    # through the proxy once it has been registered with `use_proxy`.
    scholarly.use_proxy(pg)
else:
    print("Warning: ScraperAPI proxy setup failed; scholarly will not use the proxy.")

In [6]:
# Start a new publication search for a different dataset ID; this rebinds
# `search_query`, replacing the earlier search iterator.
search_query = scholarly.search_pubs('ds000117')

In [7]:
# Pull the first hit from the search iterator without filling it
# (the saved output below shows 'filled': False).
next(search_query)

{'container_type': 'Publication',
 'source': <PublicationSource.PUBLICATION_SEARCH_SNIPPET: 'PUBLICATION_SEARCH_SNIPPET'>,
 'bib': {'title': 'A reproducible MEG/EEG group study with the MNE software: recommendations, quality assessments, and good practices',
  'author': ['M Jas', 'E Larson', 'DA Engemann'],
  'pub_year': '2018',
  'venue': 'Frontiers in …',
  'abstract': 'Cognitive neuroscience questions are commonly tested with experiments that involve a cohort  of subjects. The cohort can consist of a handful of subjects for small studies to hundreds'},
 'filled': False,
 'gsrank': 1,
 'pub_url': 'https://www.frontiersin.org/articles/10.3389/fnins.2018.00530/full',
 'author_id': ['YIi1T7IAAAAJ', '87KLuLUAAAAJ', 'ombAzhMAAAAJ'],
 'url_scholarbib': '/scholar?hl=en&q=info:HCW-atpSAb4J:scholar.google.com/&output=cite&scirp=0&hl=en',
 'url_add_sclib': '/citations?hl=en&xsrf=&continue=/scholar%3Fq%3Dds000117%26hl%3Den%26as_sdt%3D0,33&citilm=1&update_op=library_add&info=HCW-atpSAb4J&ei=7_i5

## Sample script using the `getCitations` module to retrieve the number of citations and the citation details

In [None]:
import getCitations
dataset = "ds003374"

# Number of Citations
citation_nums = getCitations.get_citation_numbers(dataset)

# Citation Details
# Bind `citations` up front so the name exists even when nothing was found;
# previously the `print` below raised NameError when `citation_nums` was 0.
citations = None
if citation_nums != 0:
    citations = getCitations.get_citations(dataset, citation_nums)
    print(citations.keys())
else:
    print(f"No citations found for {dataset}")

In [None]:
# Display the citation details retrieved above.
citations

## Sample commands to save the citations to a Pickle or Excel file

In [None]:
import os

# `to_pickle` does not create missing directories, so make sure the output
# folder exists before writing.
os.makedirs("citations", exist_ok=True)
citations.to_pickle("citations/"+dataset+".pkl")

In [5]:
import pandas as pd
# Read the pickled citations for ds003374 back from disk.
# NOTE(review): unpickling can execute arbitrary code — only load pickle files
# that you created yourself.
loaded_cites = pd.read_pickle("citations/ds003374.pkl")

In [None]:
# Export the citations loaded from the ds003374 pickle to Excel. The file is
# named after the dataset the data came from; it was previously written to
# ds000117.xlsx, which mislabelled the contents.
loaded_cites.to_excel("citations/ds003374.xlsx")

In [6]:
# Display the reloaded citations table.
loaded_cites

Unnamed: 0,title,author,venue,year,url,cited_by,bib
0,Dataset of spiking and LFP activity invasively...,"[T Fedele, E Boran, V Chirkov, P Hilfiker, T G...",Scientific data,2021.0,https://www.nature.com/articles/s41597-020-007...,6,{'title': 'Dataset of spiking and LFP activity...
1,Open multimodal iEEG-fMRI dataset from natural...,"[J Berezutskaya, MJ Vansteensel, EJ Aarnoutse]",Scientific Data,2022.0,https://www.nature.com/articles/s41597-022-011...,11,{'title': 'Open multimodal iEEG-fMRI dataset f...
2,Epileptic high-frequency oscillations in intra...,"[E Boran, L Stieglitz, J Sarnthein]",Frontiers in Human Neuroscience,2021.0,https://www.frontiersin.org/articles/10.3389/f...,8,{'title': 'Epileptic high-frequency oscillatio...
3,Dataset of spiking and LFP activity invasively...,"[L Stieglitz, H Jokeit, J Sarnthein]",,,,0,{'title': 'Dataset of spiking and LFP activity...


In [8]:
# Select the 'title' column, then the entry at index 0, to show the first title in full
# (the table display above truncates long titles with "...").
loaded_cites['title'][0]

'Dataset of spiking and LFP activity invasively recorded in the human amygdala during aversive dynamic stimuli'