In [2]:
from Bio import Entrez

# Contact address that Biopython attaches to each E-utilities request.
Entrez.email = "basemal.alqusaimi@gmail.com"

# Search PubMed for sepsis biomarkers
query = "sepsis AND biomarker"

# Single source of truth for the sample size: used both as the search cap
# and in the label printed below, so the two cannot drift apart.
MAX_RESULTS = 10

handle = Entrez.esearch(
    db="pubmed",
    term=query,
    retmax=MAX_RESULTS,
)

# Release the connection even if parsing the response raises.
try:
    results = Entrez.read(handle)
finally:
    handle.close()

# PMIDs of the matching papers (at most MAX_RESULTS of them).
pmid_list = results["IdList"]

print("Query:", query)
print("Number of results found:", results["Count"])
print(f"First {MAX_RESULTS} PMIDs:", pmid_list)


Query: sepsis AND biomarker
Number of results found: 15786
First 10 PMIDs: ['41676092', '41676054', '41674606', '41674120', '41672594', '41670654', '41669529', '41669126', '41668768', '41668763']


In [3]:
from Bio import Medline

# Fetch the MEDLINE-formatted details for the PMIDs found by the search.
# With no PMIDs there is nothing to request, so the fetch is skipped.
if pmid_list:
    handle = Entrez.efetch(
        db="pubmed",
        id=",".join(pmid_list),
        rettype="medline",
        retmode="text",
    )
    # Release the connection even if parsing fails part-way through.
    try:
        records = list(Medline.parse(handle))
    finally:
        handle.close()
else:
    records = []

print("Downloaded records:", len(records))

# Preview the first record. Guarded so that an empty download is reported
# instead of raising IndexError on records[0].
if records:
    first = records[0]

    print("\nTITLE:\n", first.get("TI", "?"))
    print("\nYEAR:\n", first.get("DP", "?"))
    print("\nABSTRACT (first 500 chars):\n", first.get("AB", "")[:500])
else:
    print("\nNo records to preview.")


Downloaded records: 10

TITLE:
 The endothelial activation and stress index as a predictor of 28-day mortality in pulmonary sepsis: a retrospective two-cohort analysis.

YEAR:
 2026

ABSTRACT (first 500 chars):
 BACKGROUND: The Endothelial Activation and Stress Index (EASIX) is an emerging biomarker that serves as a straightforward and objective measure of systemic endothelial dysfunction and critical illness severity. This study aims to evaluate the prognostic value of EASIX for 28-day mortality in patients with pulmonary sepsis. MATERIALS AND METHODS: This retrospective study utilised a two-cohort design. The internal cohort was derived from MIMIC-IV; an external cohort was derived from a tertiary hos


In [4]:
import pandas as pd

# Flatten each MEDLINE record into one row, keeping only the fields needed
# downstream. Missing fields fall back to an empty string, and the year is
# taken as the first four characters of the "DP" field.
papers = [
    {
        "pmid": record.get("PMID", ""),
        "title": record.get("TI", ""),
        "year": record.get("DP", "")[:4],
        "abstract": record.get("AB", ""),
    }
    for record in records
]

df = pd.DataFrame(papers)

# Quick sanity check: first rows, then the overall dimensions.
print(df.head())
print("\nShape:", df.shape)


       pmid                                              title  year  \
0  41676092  The endothelial activation and stress index as...  2026   
1  41676054  Use of LVAD HeartMate 3 and Impella RP in the ...  2026   
2  41674606  Rapid Detection of Inter-alpha Inhibitor Prote...  2026   
3  41674120  Interpreting peripheral oxygen saturation vari...  2026   
4  41672594  Phase 1 open-label study of ASP9801, an oncoly...  2026   

                                            abstract  
0  BACKGROUND: The Endothelial Activation and Str...  
1  Heart failure (HF) is a leading cause of morbi...  
2  Inter-alpha Inhibitor Proteins (IAIP) are seri...  
3  Peripheral oxygen saturation ( SpO2 ) exhibits...  
4  PURPOSE: ASP9801, an oncolytic virus encoding ...  

Shape: (10, 4)


In [5]:
from pathlib import Path

# Destination is resolved relative to the current working directory.
output_path = Path("../data/sepsis_sample_10.csv")

# to_csv does not create missing folders, so make sure the target directory
# exists; exist_ok keeps re-runs of this cell from failing.
output_path.parent.mkdir(parents=True, exist_ok=True)

df.to_csv(output_path, index=False)

print("✅ Saved to data/sepsis_sample_10.csv")


✅ Saved to data/sepsis_sample_10.csv
