In [1]:
# Load the E2B, OpenAI and PubMed API keys from local key files and export
# them as environment variables.
import os


def _read_key(path):
    """Return the contents of the key file at `path` without surrounding whitespace.

    Key files usually end with a newline; leaving it in the value would put a
    stray newline into the exported environment variable.

    Raises:
        FileNotFoundError: if `path` does not exist.
        ValueError: if the file is empty or contains only whitespace.
    """
    with open(path, "r") as f:
        key = f.read().strip()
    if not key:
        raise ValueError(f"API key file {path!r} is empty")
    return key


# E2B sandbox API
E2B_API_KEY = _read_key("e2b.key")
os.environ["E2B_API_KEY"] = E2B_API_KEY

# OpenAI API key
OPENAI_API_KEY_GLOBAL = _read_key("openai.key")
os.environ["OPENAI_API_KEY"] = OPENAI_API_KEY_GLOBAL

# PubMed API key
DEFAULT_PUBMED_API_KEY = _read_key("pubmed.key")
os.environ["PUBMED_API_KEY"] = DEFAULT_PUBMED_API_KEY

# Study characteristics extraction

In [2]:
from trialmind.pubmed import pmid2biocxml, parse_bioc_xml

In [3]:
# PubMed IDs of the studies to process.
pmid_list = [
    '38514163',
    '38510282',
    '37913939',
    '38323364',
    '38212825',
    '37790460',
    '37525573',
    '37686569',
    '37827067',
    '37575835',
]

# Fetch the BioC XML for the PMIDs and parse each returned item.
res = [parse_bioc_xml(xml_doc) for xml_doc in pmid2biocxml(pmid_list)]

In [4]:
# Turn each parsed document into a single text string by joining the
# 'content' of its passages with newlines.
papers = [
    "\n".join(passage['content'] for passage in parsed_doc["passage"])
    for parsed_doc in res
]
papers

['',
 'Clinical Outcomes Among Immunotherapy-Treated Patients With Primary Cardiac Soft Tissue Sarcomas\nBackground\nPrimary cardiac soft tissue sarcomas (CSTS) affect young adults, with dismal outcomes.\nObjectives\nThe aim of this study was to investigate the clinical outcomes of patients with CSTS receiving immune checkpoint inhibitors (ICIs).\nMethods\nA retrospective, multi-institutional cohort study was conducted among patients with CSTS between 2015 and 2022. The patients were treated with ICI-based regimens. The Kaplan-Meier method was used to estimate overall survival (OS) and progression-free survival (PFS). Objective response rates were determined according to Response Evaluation Criteria in Solid Tumors version 1.1. Treatment-related adverse events were graded per the Common Terminology Criteria for Adverse Events version 5.0.\nResults\nAmong 24 patients with CSTS, 17 (70.8%) were White, and 13 (54.2%) were male. Eight patients (33.3%) had angiosarcoma. At the time of ICI t

In [6]:
from trialmind.api import StudyCharacteristicsExtraction

# Run study-characteristics extraction over every paper text, using the
# API object's default field list and the "openai-gpt-4o" model identifier.
api = StudyCharacteristicsExtraction()
extracted = api.run(papers=papers, fields=api.DEFAULT_FIELDS, llm="openai-gpt-4o")

In [8]:
# Inspect the text of the first paper; in the saved output it is an empty string.
papers[0]


''

In [7]:
# Inspect the fields extracted for the first paper; in the saved output every value is 'NP'.
extracted[0]

[{'name': 'Study Name', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Study Type', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Study Year', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Location', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Phase', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Conditions', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Treatments', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Comparison', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Num Patients', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Mean Age', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Age Range', 'value': 'NP', 'source_id': [], 'cited_blocks': []}]

In [9]:
# Inspect the fields extracted for the second paper, including their source ids and cited blocks.
extracted[1]

[{'name': 'Study Name', 'value': 'NP', 'source_id': [], 'cited_blocks': []},
 {'name': 'Study Type',
  'value': 'observational study',
  'source_id': [2, 3, 26],
  'cited_blocks': ['Patient population\nThis study was based on an analysis of a retrospective, multicenter database. Data from 8 participating institutions in the United States (Supplemental TableÂ\xa01) were obtained and are currently housed at the Dana-Farber Cancer Institute. According to the Declaration of Helsinki, this retrospective study was covered by the Institutional Review Board review at the Dana-Farber Cancer Institute (protocol 21-329) and local Institutional Review Boards at participating sites.',
   'The introduction of immune checkpoint inhibitors (ICIs) has successfully shifted the treatment paradigm in oncology, and these agents have received regulatory approval for a broad spectrum of tumor types. In noncardiac sarcomas, clinical trials of ICIs have shown promising results, with response rates ranging betw