# Description

In this paper, I will download list of accepted paper from DBLP using DBLP api.

In [56]:
import os 
import numpy as np
import pandas as pd
import json
from typing import List, Tuple, Dict
import requests
import xml.etree.ElementTree as ET

In [51]:
LIST_CONF_NAME = ['mlsys']

In [61]:


def fetch_mlsys_xml(conf_name:str, year:int) -> bytes:
    """
    Fetch the XML data for the specified conference and year.
    """
    url = f"https://dblp.org/db/conf/{conf_name}/{conf_name}{year}.xml"
    resp = requests.get(url)
    resp.raise_for_status()
    return resp.content


def parse_mlsys_xml(xml_string: bytes) -> List[Dict]:
    root = ET.fromstring(xml_string)
    list_papers = []

    for r in root.findall(".//r"):
        inproc = r.find("inproceedings")
        if inproc is not None:
            title = inproc.findtext("title", default="").strip()
            authors = [a.text for a in inproc.findall("author")]
            url = inproc.findtext("ee", default="")
            year = inproc.findtext("year", default="")

            list_papers.append({
                "title": title,
                "authors": authors,
                "year": year,
                "url": url
            })
    return list_papers

In [62]:
conf_name = "mlsys"
year = 2023

xml_data = fetch_mlsys_xml(conf_name, year)
print(xml_data)

b'<bht key="db/conf/mlsys/mlsys2023.bht" title="MLSys 2023"> \n<h1>6th <ref href="db/conf/mlsys/index.html">MLSys</ref> 2023:\nMiami, FL, USA</h1> <dblpcites><r><proceedings key="conf/mlsys/2023" mdate="2024-06-28">\n<editor pid="s/DXSong">Dawn Song</editor>\n<editor pid="07/3119">Michael Carbin</editor>\n<editor pid="94/8023-1">Tianqi Chen 0001</editor>\n<title>Proceedings of the Sixth Conference on Machine Learning and Systems, MLSys 2023, Miami, FL, USA, June 4-8, 2023</title>\n<booktitle>MLSys</booktitle>\n<publisher>mlsys.org</publisher>\n<year>2023</year>\n<ee type="oa">https://proceedings.mlsys.org/book/2023</ee>\n<url>db/conf/mlsys/mlsys2023.html</url>\n</proceedings>\n</r>\n<r style="ee"><inproceedings key="conf/mlsys/KwonNSYMZSCZVBM23" mdate="2024-06-28">\n<author pid="203/0006">Hyoukjun Kwon</author>\n<author pid="126/3171">Krishnakumar Nair</author>\n<author pid="334/0541">Jamin Seo</author>\n<author pid="314/7067">Jason Yik</author>\n<author pid="68/6394">Debabrata Mohapat

In [63]:
list_papers = parse_mlsys_xml(xml_data)

for paper in list_papers:
    print(f"Title: {paper['title']}")
    print(f"Authors: {', '.join(paper['authors'])}")
    print(f"Year: {paper['year']}")
    print(f"URL: {paper['url']}")
    print("-" * 60)

Title: XRBench: An Extended Reality (XR) Machine Learning Benchmark Suite for the Metaverse.
Authors: Hyoukjun Kwon, Krishnakumar Nair, Jamin Seo, Jason Yik, Debabrata Mohapatra, Dongyuan Zhan, Jinook Song, Peter Capak, Peizhao Zhang, Peter Vajda, Colby R. Banbury, Mark Mazumder, Liangzhen Lai, Ashish Sirasao, Tushar Krishna, Harshit Khaitan, Vikas Chandra, Vijay Janapa Reddi
Year: 2023
URL: https://proceedings.mlsys.org/paper_files/paper/2023/hash/07b7c2f8a6978e376f9656d69619bfbb-Abstract-mlsys2023.html
------------------------------------------------------------
Title: FLINT: A Platform for Federated Learning Integration.
Authors: Ewen Wang, Boyi Chen, Mosharaf Chowdhury, Ajay Kannan, Franco Liang
Year: 2023
URL: https://proceedings.mlsys.org/paper_files/paper/2023/hash/0a1603bfce9502551ad89906515b5941-Abstract-mlsys2023.html
------------------------------------------------------------
Title: Practical Edge Kernels for Integer-Only Vision Transformers Under Post-training Quantization