In [3]:
import arxiv
import pandas as pd

# The query keeps papers whose arXiv comment contains "acl".  A combined
# filter such as "co:acl+2023" cannot be used, so the year is narrowed down
# on the DataFrame further below instead.
search_options = dict(
    query="co:acl",
    max_results=2000,
    sort_by=arxiv.SortCriterion.SubmittedDate,
)
search = arxiv.Search(**search_options)

# Flatten every search hit into one row.  The field order has to stay in
# sync with the column labels used when the DataFrame is built.
papers = []
for result in search.results():
    # Author objects are reduced to a single comma-separated string of names.
    authors = ", ".join(author.name for author in result.authors)
    papers.append(
        [
            result.entry_id,
            result.updated,
            result.published,
            result.title,
            result.summary,
            result.comment,
            result.primary_category,
            authors,
        ]
    )

In [4]:
# Number of rows collected.  A count equal to max_results (2000) means the
# result list hit the cap, so the query may have more matches than were fetched.
len(papers)

2000

In [5]:
# Column labels, listed in the same order as the fields of each row in `papers`.
cols = [
    "entry_id",
    "updated",
    "published",
    "title",
    "summary",
    "comment",
    "primary_category",
    "authors",
]

df = pd.DataFrame(data=papers, columns=cols)

In [6]:
# First pass: every row whose comment mentions "23" anywhere.
df.loc[df["comment"].str.contains("23")]

Unnamed: 0,entry_id,updated,published,title,summary,comment,primary_category,authors
1,http://arxiv.org/abs/2306.12907v1,2023-06-22 14:20:15+00:00,2023-06-22 14:20:15+00:00,xSIM++: An Improved Proxy to Bitext Mining Per...,We introduce a new proxy score for evaluating ...,The first two authors contributed equally; ACL...,cs.CL,"Mingda Chen, Kevin Heffernan, Onur Çelebi, Ale..."
2,http://arxiv.org/abs/2306.12619v1,2023-06-22 01:14:47+00:00,2023-06-22 01:14:47+00:00,Class-Incremental Learning based on Label Gene...,Despite the great success of pre-trained langu...,"12 pages, ACL 2023 Main Conference",cs.CL,"Yijia Shao, Yiduo Guo, Dongyan Zhao, Bing Liu"
3,http://arxiv.org/abs/2306.12581v1,2023-06-21 21:34:39+00:00,2023-06-21 21:34:39+00:00,Morphological Inflection with Phonological Fea...,Recent years have brought great advances into ...,"ACL 2023 main conference; 8 pages, 1 figure",cs.CL,"David Guriel, Omer Goldman, Reut Tsarfaty"
4,http://arxiv.org/abs/2306.12181v1,2023-06-21 11:24:41+00:00,2023-06-21 11:24:41+00:00,Feature Interactions Reveal Linguistic Structu...,We study feature interactions in the context o...,ACL Findings 2023,cs.CL,"Jaap Jumelet, Willem Zuidema"
5,http://arxiv.org/abs/2306.12146v1,2023-06-21 09:50:48+00:00,2023-06-21 09:50:48+00:00,Which Spurious Correlations Impact Reasoning i...,We present a human-in-the-loop dashboard tailo...,"7 pages, Accepted at ACL 2023: System Demonstr...",cs.CL,"Robin Chan, Afra Amini, Mennatallah El-Assady"
...,...,...,...,...,...,...,...,...
1584,http://arxiv.org/abs/2110.01176v3,2023-06-13 16:46:04+00:00,2021-10-04 03:59:15+00:00,Contextualized Semantic Distance between Highl...,Overlapping frequently occurs in paired texts ...,Accepted to ACL 2023 (findings),cs.CL,"Letian Peng, Zuchao Li, Hai Zhao"
1634,http://arxiv.org/abs/2108.11590v2,2023-05-04 20:22:25+00:00,2021-08-26 05:44:20+00:00,AVATAR: A Parallel Corpus for Java-Python Prog...,Program translation refers to migrating source...,Accepted to Findings of ACL 2023,cs.SE,"Wasi Uddin Ahmad, Md Golam Rahman Tushar, Saik..."
1741,http://arxiv.org/abs/2106.13213v1,2021-06-24 17:46:03+00:00,2021-06-24 17:46:03+00:00,Learning Language and Multimodal Privacy-Prese...,Mental health conditions remain underdiagnosed...,ACL 2021. arXiv admin note: substantial text o...,cs.LG,"Paul Pu Liang, Terrance Liu, Anna Cai, Michal ..."
1878,http://arxiv.org/abs/2106.02792v2,2021-06-21 00:30:45+00:00,2021-06-05 04:31:06+00:00,Weakly-Supervised Methods for Suicide Risk Ass...,Social media has become a valuable resource fo...,ACL 2021 short paper. Code is available at\n ...,cs.CL,"Chenghao Yang, Yudong Zhang, Smaranda Muresan"


In [7]:
# Rows whose comment mentions "23" without spelling out "2023"
# (shows which short year notations are in use).
mentions_23 = df["comment"].str.contains("23")
mentions_2023 = df["comment"].str.contains("2023")
df[mentions_23 & ~mentions_2023]

Unnamed: 0,entry_id,updated,published,title,summary,comment,primary_category,authors
114,http://arxiv.org/abs/2306.03723v1,2023-06-06 14:41:30+00:00,2023-06-06 14:41:30+00:00,Financial Numeric Extreme Labelling: A Dataset...,The U.S. Securities and Exchange Commission (S...,Accepted to ACL'23 Findings Paper,cs.CL,"Soumya Sharma, Subhendu Khatuya, Manjunath Heg..."
176,http://arxiv.org/abs/2306.01200v1,2023-06-01 23:27:49+00:00,2023-06-01 23:27:49+00:00,Multi-Dimensional Evaluation of Text Summariza...,Evaluation of natural language generation (NLG...,ACL Findings '23,cs.CL,"Sameer Jain, Vaishakh Keshava, Swarnashree Mys..."
234,http://arxiv.org/abs/2305.19228v1,2023-05-30 17:20:25+00:00,2023-05-30 17:20:25+00:00,Unsupervised Melody-to-Lyric Generation,Automatic melody-to-lyric generation is a task...,Accepted to ACL 23. arXiv admin note: substant...,cs.CL,"Yufei Tian, Anjali Narayan-Chen, Shereen Oraby..."
295,http://arxiv.org/abs/2306.00005v1,2023-05-27 17:25:13+00:00,2023-05-27 17:25:13+00:00,A Two-Stage Decoder for Efficient ICD Coding,Clinical notes in healthcare facilities are ta...,Accepted to ACL'23,cs.CL,"Thanh-Tung Nguyen, Viktor Schlegel, Abhinav Ka..."
373,http://arxiv.org/abs/2305.16641v1,2023-05-26 05:29:37+00:00,2023-05-26 05:29:37+00:00,Are Fairy Tales Fair? Analyzing Gender Bias in...,Social biases and stereotypes are embedded in ...,acl 23,cs.CL,"Paulina Toro Isaza, Guangxuan Xu, Akintoye Olo..."
383,http://arxiv.org/abs/2305.16559v1,2023-05-26 00:57:43+00:00,2023-05-26 00:57:43+00:00,Teamwork Is Not Always Good: An Empirical Stud...,Class-incremental learning (CIL) aims to devel...,"ACL'23 (Findings). 15 pages, 3 figures, 7 tables",cs.CL,"Minqian Liu, Lifu Huang"
418,http://arxiv.org/abs/2305.15597v1,2023-05-24 22:09:35+00:00,2023-05-24 22:09:35+00:00,Text-Augmented Open Knowledge Graph Completion...,The mission of open knowledge graph (KG) compl...,"18 pages, 11 figures, 8 tables. Accepted by AC...",cs.CL,"Pengcheng Jiang, Shivam Agarwal, Bowen Jin, Xu..."
432,http://arxiv.org/abs/2305.15182v2,2023-06-09 08:53:14+00:00,2023-05-24 14:14:08+00:00,HiTIN: Hierarchy-aware Tree Isomorphism Networ...,Hierarchical text classification (HTC) is a ch...,Accepted by ACL'23,cs.CL,"He Zhu, Chong Zhang, Junjie Huang, Junran Wu, ..."
452,http://arxiv.org/abs/2305.14618v1,2023-05-24 01:35:10+00:00,2023-05-24 01:35:10+00:00,Abductive Commonsense Reasoning Exploiting Mut...,Abductive reasoning aims to find plausible exp...,accepted at ACL'23,cs.CL,"Wenting Zhao, Justin T. Chiu, Claire Cardie, A..."
464,http://arxiv.org/abs/2305.13833v1,2023-05-23 08:53:33+00:00,2023-05-23 08:53:33+00:00,Reducing Sensitivity on Speaker Names for Text...,Changing speaker names consistently throughout...,findings of ACL'23,cs.CL,"Qi Jia, Haifeng Tang, Kenny Q. Zhu"


In [8]:
# Keep only comments that name ACL together with the year 2023 ("ACL 2023",
# "ACL'23", "ACL Findings '23", "acl 23", ...).  A bare "23" substring also
# hits unrelated digits (the output of the exploratory "23" filter shows
# "ACL 2021" comments among the matches), so the year has to
#   * follow "acl" within 40 characters, with no digit and no sentence break
#     (".", ";", newline) in between, and
#   * not be followed by another digit.
# Caveat: comments that put the year before the venue ("2023 ACL") are not
# matched by this pattern.
# na=False treats a missing comment as "no match" instead of putting NaN
# into the boolean mask.
acl_2023_pattern = r"(?i)\bacl[^.;\n\d]{0,40}(?:20)?23(?!\d)"
df_acl_23 = df[df["comment"].str.contains(acl_2023_pattern, na=False)].reset_index(drop=True)

In [9]:
# Persist the filtered papers as a CSV file (path is relative to the working directory).
df_acl_23.to_csv(path_or_buf="arxiv_acl_2023.csv")