In [2]:
import urllib
import pandas as pd

In [17]:
import urllib.request
import feedparser

import urllib.parse  # explicit: urlencode is used below to build the query string

# Base URL of the arXiv API query endpoint
base_url = 'http://export.arxiv.org/api/query?'

# Search parameters
search_query = 'all:electron'  # search for electron in all fields
start = 0                      # index of the first result to return
max_results = 5                # number of results to retrieve

# Build the query string with urlencode so that searches containing spaces or
# reserved characters (e.g. 'all:electron AND ti:cusp') still yield a valid
# URL; urlopen rejects raw spaces. ':' is kept literal so the field prefix
# stays readable and the URL for the query above is unchanged.
query = urllib.parse.urlencode(
    {
        'search_query': search_query,
        'start': start,
        'max_results': max_results,
    },
    safe=':',
)

# Perform a GET request. The timeout (seconds) keeps the cell from hanging
# forever if the server does not answer.
with urllib.request.urlopen(base_url + query, timeout=30) as http_response:
    response = http_response.read()

# Parse the raw Atom response using feedparser
feed = feedparser.parse(response)

# Print out feed information
print(f'Feed title: {feed.feed.title}')
print(f'Feed last updated: {feed.feed.updated}')

# Print opensearch metadata
print(f'totalResults for this query: {feed.feed.opensearch_totalresults}')
print(f'itemsPerPage for this query: {feed.feed.opensearch_itemsperpage}')
print(f'startIndex for this query: {feed.feed.opensearch_startindex}')

# Run through each entry of the parsed feed and print its metadata.
# Optional fields are read defensively so one incomplete entry does not
# abort the whole listing.
for entry in feed.entries:
    print('\n--- e-print metadata ---')
    # The identifier is whatever follows "/abs/" in the entry id
    print(f'arxiv-id: {entry.id.split("/abs/")[-1]}')
    print(f'Published: {entry.published}')
    print(f'Title: {entry.title.strip()}')

    # Handle authors: prefer the full author list, fall back to the single
    # `author` field, and finally to a placeholder so the fallback itself
    # cannot raise AttributeError.
    try:
        authors = ", ".join(author.name for author in entry.authors)
    except AttributeError:
        authors = getattr(entry, 'author', 'No authors found')
    print(f'Authors: {authors}')

    # Links (abs + pdf). Both `rel` and `title` are optional on a link, so
    # both are read with getattr.
    for link in entry.links:
        if getattr(link, "rel", "") == 'alternate':
            print(f'abs page link: {link.href}')
        elif getattr(link, "title", "") == 'pdf':
            print(f'pdf link: {link.href}')

    # Journal reference
    journal_ref = getattr(entry, 'arxiv_journal_ref', 'No journal ref found')
    print(f'Journal reference: {journal_ref}')

    # Comments
    comment = getattr(entry, 'arxiv_comment', 'No comment found')
    print(f'Comments: {comment}')

    # Categories: the first tag is taken as the primary category. A missing
    # *or empty* tag list yields "N/A" instead of an IndexError.
    all_categories = [t['term'] for t in (getattr(entry, 'tags', None) or [])]
    primary_category = all_categories[0] if all_categories else "N/A"

    print(f'Primary Category: {primary_category}')
    print(f'All Categories: {", ".join(all_categories)}')

    # Abstract
    print(f'Abstract: {entry.summary.strip()}')


Feed title: ArXiv Query: search_query=all:electron&amp;id_list=&amp;start=0&amp;max_results=5
Feed last updated: 2025-10-02T00:00:00-04:00
totalResults for this query: 230459
itemsPerPage for this query: 5
startIndex for this query: 0

--- e-print metadata ---
arxiv-id: cond-mat/0102536v1
Published: 2001-02-28T20:12:09Z
Title: Impact of Electron-Electron Cusp on Configuration Interaction Energies
Authors: David Prendergast, M. Nolan, Claudia Filippi, Stephen Fahy, J. C. Greer
abs page link: http://arxiv.org/abs/cond-mat/0102536v1
pdf link: http://arxiv.org/pdf/cond-mat/0102536v1
Journal reference: J. Chem. Phys. 115, 1626 (2001)
Comments: 11 pages, 6 figures, 3 tables, LaTeX209, submitted to The Journal of
  Chemical Physics
Primary Category: cond-mat.str-el
All Categories: cond-mat.str-el
Abstract: The effect of the electron-electron cusp on the convergence of configuration
interaction (CI) wave functions is examined. By analogy with the
pseudopotential approach for electron-ion inter

In [None]:
import requests
import fitz  # PyMuPDF

arxiv_id = "cond-mat/0102536v1"
pdf_url = f"https://arxiv.org/pdf/{arxiv_id}.pdf"

# Download PDF
# The timeout (seconds) prevents the cell from hanging indefinitely, and
# raise_for_status() stops here on an HTTP error instead of saving an error
# page under a .pdf name and failing later inside the PDF parser.
pdf_response = requests.get(pdf_url, timeout=60)
pdf_response.raise_for_status()
with open("paper.pdf", "wb") as f:
    f.write(pdf_response.content)

# Extract text
# The context manager closes the document when extraction is done; the pages
# are joined in one pass rather than by repeated string concatenation.
with fitz.open("paper.pdf") as doc:
    text = "".join(page.get_text() for page in doc)

# Show only the beginning of the extracted text to keep the output readable
print(text[:10000])


arXiv:cond-mat/0102536v1  [cond-mat.str-el]  28 Feb 2001
Impact of Electron-Electron Cusp on Conﬁguration Interaction Energies
David Prendergast,a) M. Nolan,b) Claudia Filippi,a) Stephen Fahy,a) and J.C. Greerb)
a)Department of Physics and b)NMRC, University College, Cork, Ireland
(November 26, 2024)
The eﬀect of the electron-electron cusp on the convergence of conﬁguration interaction (CI) wave
functions is examined. By analogy with the pseudopotential approach for electron-ion interactions,
an eﬀective electron-electron interaction is developed which closely reproduces the scattering of
the Coulomb interaction but is smooth and ﬁnite at zero electron-electron separation. The exact
many-electron wave function for this smooth eﬀective interaction has no cusp at zero electron-
electron separation. We perform CI and quantum Monte Carlo calculations for He and Be atoms,
both with the Coulomb electron-electron interaction and with the smooth eﬀective electron-electron
interaction. We ﬁnd t