In [11]:
## ENTREZ, import modules
from Bio import Entrez

In [13]:
#help(Entrez)

Help on package Bio.Entrez in Bio:

NAME
    Bio.Entrez - Provides code to access NCBI over the WWW.

DESCRIPTION
    The main Entrez web page is available at:
    http://www.ncbi.nlm.nih.gov/Entrez/

    Entrez Programming Utilities web page is available at:
    http://www.ncbi.nlm.nih.gov/books/NBK25501/

    This module provides a number of functions like ``efetch`` (short for
    Entrez Fetch) which will return the data as a handle object. This is
    a standard interface used in Python for reading data from a file, or
    in this case a remote network connection, and provides methods like
    ``.read()`` or offers iteration over the contents line by line. See
    also "What the heck is a handle?" in the Biopython Tutorial and
    Cookbook: http://biopython.org/DIST/docs/tutorial/Tutorial.html
    http://biopython.org/DIST/docs/tutorial/Tutorial.pdf
    The handle returned by these functions can be either in text mode or
    in binary mode, depending on the data requested and the r

In [17]:
#To access NCBI Entrez programming utilities, type:
Entrez.email = "datacyclopes@gmail.com"

In [19]:
handle = Entrez.einfo()
record = Entrez.read(handle)
record["DbList"]

['pubmed', 'protein', 'nuccore', 'ipg', 'nucleotide', 'structure', 'genome', 'annotinfo', 'assembly', 'bioproject', 'biosample', 'blastdbinfo', 'books', 'cdd', 'clinvar', 'gap', 'gapplus', 'grasp', 'dbvar', 'gene', 'gds', 'geoprofiles', 'medgen', 'mesh', 'nlmcatalog', 'omim', 'orgtrack', 'pmc', 'popset', 'proteinclusters', 'pcassay', 'protfam', 'pccompound', 'pcsubstance', 'seqannot', 'snp', 'sra', 'taxonomy', 'biocollections', 'gtr']

In [21]:
#PUBMED
handle = Entrez.einfo(db="pubmed")
record = Entrez.read(handle)
record["DbInfo"]["Description"]

'PubMed bibliographic record'

In [23]:
record["DbInfo"]["Count"]

'37733308'

In [30]:
handle = Entrez.esearch(db="pubmed", term="cybernetics")
record = Entrez.read(handle)
record["IdList"]

['39264232', '39258649', '39246299', '39241843', '39237206', '39233507', '39221376', '39210956', '39211574', '39198641', '39196465', '39194422', '39182722', '39176945', '39175607', '39160074', '39158305', '39151232', '39148556', '39147947']

In [34]:
handle = Entrez.esummary(db="pubmed", id="39175607, 39258649")
records = Entrez.parse(handle)

for record in records:
    print(record["AuthorList"], record["Title"], record["PubDate"], record["FullJournalName"])

['Wheeler L', 'Worrell SE', 'Balzekas I', 'Bilderbeek J', 'Hermes D', 'Croarkin P', 'Messina S', 'Van Gompel J', 'Miller KJ', 'Kremen V', 'Worrell GA'] Case report: Bridging limbic network epilepsy with psychiatric, memory, and sleep comorbidities: case illustrations of reversible psychosis symptoms during continuous, high-frequency ANT-DBS. 2024 Frontiers in network physiology
['Blay EA', 'Piqueira JRC'] The Emergence of Edgar Morin's Complex Thinking. 2024 Anais da Academia Brasileira de Ciencias


In [36]:
handle = Entrez.efetch(db="pubmed", id="39147947")
print(handle.read())

b'<?xml version="1.0" ?>\n<!DOCTYPE PubmedArticleSet PUBLIC "-//NLM//DTD PubMedArticle, 1st January 2024//EN" "https://dtd.nlm.nih.gov/ncbi/pubmed/out/pubmed_240101.dtd">\n<PubmedArticleSet>\n<PubmedArticle><MedlineCitation Status="Publisher" Owner="NLM"><PMID Version="1">39147947</PMID><DateRevised><Year>2024</Year><Month>08</Month><Day>15</Day></DateRevised><Article PubModel="Print-Electronic"><Journal><ISSN IssnType="Electronic">1554-3528</ISSN><JournalIssue CitedMedium="Internet"><PubDate><Year>2024</Year><Month>Aug</Month><Day>15</Day></PubDate></JournalIssue><Title>Behavior research methods</Title><ISOAbbreviation>Behav Res Methods</ISOAbbreviation></Journal><ArticleTitle>A tutorial on open-source large language models for behavioral science.</ArticleTitle><ELocationID EIdType="doi" ValidYN="Y">10.3758/s13428-024-02455-8</ELocationID><Abstract><AbstractText>Large language models (LLMs) have the potential to revolutionize behavioral science by accelerating and improving the resear