In [5]:
import requests
import xml.etree.ElementTree as ET

# Search PubMed through the NCBI E-utilities ESearch endpoint and collect the
# IDs of the matching papers.
base_url = "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/"
api_url = base_url + "esearch.fcgi"
params = {
    "db": "pubmed",
    "retmode": "xml",
    "retmax": 100,  # Number of papers to retrieve (adjust as needed)
    "term": "Entyvio"  # Modify the search query to match your needs
}

# Bind the result up front so `paper_ids` exists even when the request fails;
# otherwise any later cell that reads it would raise NameError.
paper_ids = []

# requests waits forever by default; a timeout keeps the cell from hanging
# when the service is unreachable.
response = requests.get(api_url, params=params, timeout=30)
if response.status_code == 200:
    xml_content = response.content
    root = ET.fromstring(xml_content)
    # Gather the text of every <Id> element found anywhere in the response.
    paper_ids = [id_node.text for id_node in root.findall(".//Id")]
    print("Retrieved paper IDs:", paper_ids)
else:
    print("Error occurred while retrieving paper IDs:", response.status_code)


Retrieved paper IDs: ['37352154', '37350775', '37349130', '37335733', '37322825', '37318737', '37315113', '37314124', '37305935', '37303967', '37300512', '37300328', '37289109', '37288829', '37287984', '37278369', '37274297', '37265220', '37265165', '37259387', '37254193', '37247641', '37246609', '37240501', '37239166', '37235748', '37232444', '37229320', '37227615', '37224287', '37221820', '37219360', '37216614', '37214561', '37214457', '37208197', '37199618', '37198111', '37191356', '37188381', '37176570', '37172505', '37172205', '37171478', '37170542', '37168636', '37168632', '37166016', '37164738', '37158585', '37150784', '37140705', '37124368', '37115969', '37115362', '37100708', '37100606', '37099011', '37084137', '37084088', '37074509', '37069838', '37063436', '37062627', '37057077', '29999729', '37053548', '37051622', '37048587', '37042978', '37042951', '37029786', '37010772', '36999101', '36998249', '36988594', '36986833', '36983432', '36982892', '36976548', '36966279', '36964

In [6]:
# Use the NCBI E-utilities ELink endpoint to find the PubMed Central (PMC)
# records linked to one PubMed article, and turn them into article URLs.
fetch_url = base_url + "elink.fcgi"
fetch_params = {
    "dbfrom": "pubmed",
    "db": "pmc",
    "linkname": "pubmed_pmc",
    "id": "36205507"  # Replace with the desired paper ID
}

# Bind the result before the request so it is defined on the error path too.
full_text_links = []

# Bound the wait; requests has no default timeout.
fetch_response = requests.get(fetch_url, params=fetch_params, timeout=30)
if fetch_response.status_code == 200:
    xml_content = fetch_response.content
    root = ET.fromstring(xml_content)
    link_nodes = root.findall(".//Link")
    for link_node in link_nodes:
        # With the default ELink command each <Link> carries the linked
        # record's <Id> (here a numeric PMC id), not a <Url>, so looking for
        # "./Url" never matches. Build the PMC article URL from the id instead.
        pmc_id_node = link_node.find("./Id")
        if pmc_id_node is not None and pmc_id_node.text:
            pmc_id = pmc_id_node.text.strip()
            full_text_links.append(
                f"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC{pmc_id}/"
            )
    print("Retrieved full text links:", full_text_links)
else:
    print("Error occurred while retrieving full text links:", fetch_response.status_code)


Retrieved full text links: []


In [7]:
# Resolve a DOI through doi.org, asking for a CSL JSON representation.
doi = "10.1234/example_doi"  # Replace with the actual DOI
# NOTE(review): this Accept header requests CSL JSON, so the body is expected
# to be citation metadata rather than the article text itself; the
# `full_text_*` names are kept because other cells read them.
headers = {"Accept": "application/vnd.citationstyles.csl+json"}
full_text_url = f"https://doi.org/{doi}"

# Reset first so a failed lookup cannot leave a value from an earlier run
# (or no binding at all) behind.
full_text_content = None

# Bound the wait; requests has no default timeout.
response = requests.get(full_text_url, headers=headers, timeout=30)
if response.status_code == 200:
    # Process and store the retrieved content as needed
    full_text_content = response.text
    print("Retrieved full text for DOI:", doi)
else:
    print("Error occurred while retrieving full text:", response.status_code)

Error occurred while retrieving full text: 404


In [8]:
import requests

# Resolve a DOI through doi.org, asking for a CSL JSON representation.
doi = "10.1093/crocol/otad031"  # Replace with the DOI of the article you want to retrieve
# NOTE(review): this Accept header requests CSL JSON, so the body is expected
# to be citation metadata rather than the article text itself; the
# `full_text_*` names are kept because other cells read them.
headers = {"Accept": "application/vnd.citationstyles.csl+json"}
full_text_url = f"https://doi.org/{doi}"

# Reset first so a failed lookup cannot leave a stale value from an earlier
# run in `full_text_content`.
full_text_content = None

# Bound the wait; requests has no default timeout.
response = requests.get(full_text_url, headers=headers, timeout=30)
if response.status_code == 200:
    # Process and store the retrieved content as needed
    full_text_content = response.text
    print("Retrieved full text for DOI:", doi)
else:
    print("Error occurred while retrieving full text:", response.status_code)


Retrieved full text for DOI: 10.1093/crocol/otad031


In [45]:
# Display the raw response text stored in `full_text_content` by an earlier
# DOI lookup cell. The value is whatever that cell last assigned, so run the
# lookup first on a fresh kernel.
full_text_content

'{"indexed":{"date-parts":[[2023,5,30]],"date-time":"2023-05-30T04:25:52Z","timestamp":1685420752760},"reference-count":0,"publisher":"Oxford University Press (OUP)","license":[{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"am","delay-in-days":0,"URL":"https:\\/\\/creativecommons.org\\/licenses\\/by-nc\\/4.0\\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"abstract":"<jats:title>Abstract<\\/jats:title>\\n               <jats:sec>\\n                  <jats:title>Background<\\/jats:title>\\n                  <jats:p>Primary and secondary non-response to Anti-Tumor Necrosis Factor (TNF) therapy is common in patients with ulcerative colitis (UC), yet limited research has compared the effectiveness of subsequent biological therapy.<\\/jats:p>\\n               <\\/jats:sec>\\n               <jats:sec>\\n                  <jats:title>Objective<\\/jats:title>\\n                  <jats:p>We sought to compa

In [28]:
from crossref.restful import Works

# Fetch one work record by DOI through the Crossref client, then show the URL
# of the first entry in its 'link' list as the cell output.
works = Works()

w1 = works.doi('10.1177/1756283X16668093')
first_link = w1['link'][0]
first_link['URL']


'http://journals.sagepub.com/doi/pdf/10.1177/1756283X16668093'