In [1]:
######################################
########## Library/Packages ##########
######################################

#!pip install feedparser

import time
import urllib
import urllib.request

import feedparser
import pandas as pd

In [2]:
######################################
########## Data Frame Prep  ##########
######################################

# Empty frame that fixes the column layout of the collected results;
# one row per arXiv entry is added by the API-calling cell.
API_Output = pd.DataFrame(
    columns=[
        "URL",
        "Title",
        "Published",
        "Updated",
        "Author",
        "Abstract",
    ]
)


In [3]:
######################################
########## Calling from API ##########
######################################

# Base URL of the arXiv API query endpoint
base_url = 'http://export.arxiv.org/api/query?'

# Search parameters
search_query = 'all:quantum%20computing'    # already URL-encoded: articles relating to quantum computing
start = 0                                   # index of the first result to fetch
total_results = 100                         # stop index: fetch results start..total_results-1 (suggested was 20)
results_per_iteration = 50                  # max # of results requested per call (suggested was 5)
wait_time = 3                               # number of seconds to wait between calls (suggested was 3)

print('Searching arXiv for: "%s" \n\n' % search_query)

# Rows are collected in a plain list and turned into a DataFrame once at the
# end. DataFrame.append was removed in pandas 2.0, and growing a frame row by
# row copies the whole frame on every iteration.
records = []

# Page through the results, one API call per batch
for i in range(start, total_results, results_per_iteration):

    # Never request past total_results when it is not a multiple of the batch size
    batch_size = min(results_per_iteration, total_results - i)

    # Report which slice of results this call covers
    print("Results %i - %i" % (i, i + batch_size))

    # Build the query string from the search inputs
    query = 'search_query=%s&start=%i&max_results=%i' % (search_query, i, batch_size)
    request_url = base_url + query
    print(request_url)

    # Fetch the raw Atom feed; the context manager closes the connection
    # even if reading the body fails
    with urllib.request.urlopen(request_url) as http_response:
        response = http_response.read()

    # Parse the response using feedparser
    feed = feedparser.parse(response)

    # Run through each entry, and grab selected information
    for entry in feed.entries:
        records.append({"URL": entry.id,
                        "Title": entry.title,
                        "Published": entry.published[:10],  # first 10 characters = YYYY-MM-DD date part
                        "Updated": entry.updated[:10],
                        "Author": entry.author,  # Note: This is the FIRST Author only.
                        "Abstract": entry.summary})

    # Wait before calling the API again
    print('Wait %i Second(s)' % wait_time)
    time.sleep(wait_time)

# Build the result frame in one step, reusing the column layout defined in the
# data-frame prep cell. Re-running this cell replaces the rows rather than
# appending duplicates.
API_Output = pd.DataFrame(records, columns=API_Output.columns)

print("\n\nData Gathering Complete!")
display(API_Output.head(3))
display(API_Output.tail(3))

# Output into CSV
API_Output.to_csv('API_Output.csv', index=False)

Searching arXiv for: "all:quantum%20computing" 


Results 0 - 50
http://export.arxiv.org/api/query?search_query=all:quantum%20computing&start=0&max_results=50
Wait 3 Second(s)
Results 50 - 100
http://export.arxiv.org/api/query?search_query=all:quantum%20computing&start=50&max_results=50
Wait 3 Second(s)


Data Gathering Complete!


Unnamed: 0,URL,Title,Published,Updated,Author,Abstract
0,http://arxiv.org/abs/quant-ph/0003151v1,Unconventional Quantum Computing Devices,2000-03-31,2000-03-31,Seth Lloyd,This paper investigates a variety of unconvent...
1,http://arxiv.org/abs/2111.15352v2,Understanding Quantum Technologies,2021-11-24,2021-12-01,Olivier Ezratty,Understanding Quantum Technologies is a 836 pa...
2,http://arxiv.org/abs/1311.4939v1,Geometrical perspective on quantum states and ...,2013-11-20,2013-11-20,Zeqian Chen,We interpret quantum computing as a geometric ...


Unnamed: 0,URL,Title,Published,Updated,Author,Abstract
97,http://arxiv.org/abs/quant-ph/0302153v1,A prime factorization based on quantum dynamic...,2003-02-20,2003-02-20,Xijia Miao,In this paper it has been described how to use...
98,http://arxiv.org/abs/cond-mat/0102019v1,Theoretical issues in spin-based quantum dot q...,2001-02-01,2001-02-01,S. Das Sarma,We review our recent work addressing various t...
99,http://arxiv.org/abs/quant-ph/9806048v1,Quantum computation with linear optics,1998-06-14,1998-06-14,N. J. Cerf,We present a constructive method to translate ...


'git' is not recognized as an internal or external command,
operable program or batch file.
