In [1]:
import os

import bibtexparser
import pandas as pd
from eldar import Query

In [2]:
# Print the kernel's working directory; the relative file names used below are
# resolved against it. Uses the standard library instead of the `!pwd` shell
# escape so the cell does not depend on IPython or on a POSIX `pwd` binary.
print(os.getcwd())

/Volumes/ssd/01-ckj-postdoc/LLM-CCR/boolean-search


In [3]:
# Parse the BibTeX export into a bibtexparser database object.
# The encoding is pinned explicitly: without it, open() decodes with the
# platform's locale default, so the same file could load differently (or fail)
# on another machine.
# NOTE(review): assumes the .bib export is UTF-8 encoded — confirm against the file.
with open('anthology+abstracts.bib', encoding='utf-8') as bib_file:
    bib_db = bibtexparser.load(bib_file)

In [4]:
# Start from an empty table with one column per bibliographic field of interest.
bib_columns = ['title', 'author', 'booktitle', 'year', 'url', 'abstract']
df = pd.DataFrame(columns=bib_columns)

In [5]:
# Report how many entries were parsed from the .bib file.
# (original author's note: hasan et al.: 46079)
entry_count = len(bib_db.entries)
print(f"Number of items: {entry_count}")

Number of items: 97446


In [6]:
# Collect one record per BibTeX entry and build the table in a single call.
# Filling the frame cell-by-cell with df.loc[index, col] enlarges it on every
# new row, which gets slower as the frame grows and is painful for the
# ~100k entries loaded here.
bib_fields = ['title', 'author', 'booktitle', 'year', 'url', 'abstract']

# A field missing from an entry falls back to the empty string.
bib_records = [
    {field: bibitem.get(field, "") for field in bib_fields}
    for bibitem in bib_db.entries
]

# columns= fixes the column order (and keeps the columns even when there are no
# entries); dtype=object keeps the values as plain Python objects.
df = pd.DataFrame(bib_records, columns=bib_fields, dtype=object)

In [10]:
# Combine title and abstract into a single text column, separated by one space;
# this is the column the boolean queries are evaluated against.
title_text = df['title'].astype(str)
abstract_text = df['abstract'].astype(str)
df['title-abstract'] = title_text + " " + abstract_text

In [11]:
# Sanity check: print the first rows of the assembled table as plain text.
first_rows = df.head()
print(first_rows)

                                               title  \
0  Proceedings of the 8th Workshop on Online Abus...   
1  Investigating radicalisation indicators in onl...   
2  Detection of Conspiracy Theories Beyond Keywor...   
3  {E}ko{H}ate: Abusive Language and Hate Speech ...   
4  A Study of the Class Imbalance Problem in Abus...   

                                              author  \
0                                                      
1              De Kock, Christine  and\nHovy, Eduard   
2  Pustet, Milena  and\nSteffen, Elisabeth  and\n...   
3  Ilevbare, Comfort  and\nAlabi, Jesujoba  and\n...   
4  Zhang, Yaqi  and\nHangya, Viktor  and\nFraser,...   

                                           booktitle  year  \
0                                                     2024   
1  Proceedings of the 8th Workshop on Online Abus...  2024   
2  Proceedings of the 8th Workshop on Online Abus...  2024   
3  Proceedings of the 8th Workshop on Online Abus...  2024   
4  Proceedings o

In [12]:
# Sanity check: print the first values of the combined title+abstract column.
combined_preview = df['title-abstract'].head()
print(combined_preview)

0    Proceedings of the 8th Workshop on Online Abus...
1    Investigating radicalisation indicators in onl...
2    Detection of Conspiracy Theories Beyond Keywor...
3    {E}ko{H}ate: Abusive Language and Hate Speech ...
4    A Study of the Class Imbalance Problem in Abus...
Name: title-abstract, dtype: object


In [13]:
# Write the full table (including the combined text column) to CSV,
# leaving out the row index.
all_papers_csv = 'acl_all_080524.csv'
df.to_csv(all_papers_csv, index=False)

In [40]:
# Both boolean queries are built with the same eldar options
# (ignore_case, ignore_accent and match_word all enabled).
query_options = dict(ignore_case=True, ignore_accent=True, match_word=True)

# Each query requires a topic term (empath* / emot*) AND at least one of the
# task terms (detect*, recog*, predict*, classi*).
emp_eldar = Query('empath* AND (detect* OR recog* OR predict* OR classi*)', **query_options)
emo_eldar = Query('emot* AND (detect* OR recog* OR predict* OR classi*)', **query_options)

In [41]:
# Evaluate each query on every combined title+abstract string, then keep only
# the rows for which the query returned a match.
emp_mask = df['title-abstract'].apply(emp_eldar)
emo_mask = df['title-abstract'].apply(emo_eldar)

emp_res = df[emp_mask]
emo_res = df[emo_mask]

In [42]:
# Report the number of matching rows for each query.
for label, matches in (
    ("Empathy-related papers found:", emp_res),
    ("Emotion-related papers found:", emo_res),
):
    print(label, len(matches))

Empathy-related papers found: 101
Emotion-related papers found: 1053


In [43]:
# Display the rows whose combined title+abstract matched the empathy query.
emp_res

Unnamed: 0,title,author,booktitle,year,url,abstract,title-abstract
1048,Improved Text Emotion Prediction Using Combine...,"Mitsios, Michail and\nVamvoukakis, Georgios ...",Proceedings of the 2024 Conference of the Nort...,2024,https://aclanthology.org/2024.naacl-short.72,Emotion detection in textual data has received...,Improved Text Emotion Prediction Using Combine...
1224,Modeling Empathetic Alignment in Conversation,"Yang, Jiamin and\nJurgens, David",Proceedings of the 2024 Conference of the Nort...,2024,https://aclanthology.org/2024.naacl-long.172,Empathy requires perspective-taking: empatheti...,Modeling Empathetic Alignment in Conversation ...
1748,{A}cn{E}mpathize: A Dataset for Understanding ...,"Lee, Gyeongeun and\nParde, Natalie",Proceedings of the 2024 Joint International Co...,2024,https://aclanthology.org/2024.lrec-main.13,Empathy is critical for effective communicatio...,{A}cn{E}mpathize: A Dataset for Understanding ...
1859,Appraisal Framework for Clinical Empathy: A No...,"Lahnala, Allison Claire and\nNeuendorf, B{\'e...",Proceedings of the 2024 Joint International Co...,2024,https://aclanthology.org/2024.lrec-main.124,Empathy is essential in healthcare communicati...,Appraisal Framework for Clinical Empathy: A No...
1875,{ASEM}: Enhancing Empathy in Chatbot through A...,"Hamad, Omama and\nShaban, Khaled and\nHamdi,...",Proceedings of the 2024 Joint International Co...,2024,https://aclanthology.org/2024.lrec-main.140,Effective feature representations play a criti...,{ASEM}: Enhancing Empathy in Chatbot through A...
...,...,...,...,...,...,...,...
50121,Social and linguistic behavior and its correla...,"Litvak, Marina and\nOtterbacher, Jahna and\n...",Proceedings of the Workshop on Computational M...,2016,https://aclanthology.org/W16-4314,A growing body of research exploits social med...,Social and linguistic behavior and its correla...
51739,{Z}ara The {S}upergirl: An Empathetic Personal...,"Fung, Pascale and\nDey, Anik and\nSiddique, ...",Proceedings of the 2016 Conference of the Nort...,2016,https://aclanthology.org/N16-3018,,{Z}ara The {S}upergirl: An Empathetic Personal...
53116,{Z}ara: A Virtual Interactive Dialogue System ...,"Fung, Pascale and\nDey, Anik and\nSiddique, ...","Proceedings of {COLING} 2016, the 26th Interna...",2016,https://aclanthology.org/C16-2058,"Zara, or {`}Zara the Supergirl{'} is a virtual...",{Z}ara: A Virtual Interactive Dialogue System ...
53193,How Interlocutors Coordinate with each other w...,"Alam, Firoj and\nChowdhury, Shammur Absar an...","Proceedings of {COLING} 2016, the 26th Interna...",2016,https://aclanthology.org/C16-1070,"In this paper, we aim to investigate the coord...",How Interlocutors Coordinate with each other w...


In [44]:
# Display the rows whose combined title+abstract matched the emotion query.
emo_res

Unnamed: 0,title,author,booktitle,year,url,abstract,title-abstract
9,Estimating the Emotion of Disgust in {G}reek P...,"Lislevand, Vanessa and\nPavlopoulos, John an...",Proceedings of the 8th Workshop on Online Abus...,2024,https://aclanthology.org/2024.woah-1.9,We present an analysis of the sentiment in Gre...,Estimating the Emotion of Disgust in {G}reek P...
34,Topic Bias in Emotion Classification,"Wegge, Maximilian and\nKlinger, Roman",Proceedings of the Ninth Workshop on Noisy and...,2024,https://aclanthology.org/2024.wnut-1.9,Emotion corpora are typically sampled based on...,Topic Bias in Emotion Classification Emotion c...
38,{E}mo{M}ix-3{L}: A Code-Mixed Dataset for {B}a...,"Raihan, Nishat and\nGoswami, Dhiman and\nMah...",Proceedings of the 7th Workshop on Indian Lang...,2024,https://aclanthology.org/2024.wildre-1.2,Code-mixing is a well-studied linguistic pheno...,{E}mo{M}ix-3{L}: A Code-Mixed Dataset for {B}a...
142,"Ice and Fire: Dataset on Sentiment, Emotions, ...","Fri{\dh}riksd{\'o}ttir, Steinunn Rut and\nSim...","Proceedings of the Fourth Workshop on Threat, ...",2024,https://aclanthology.org/2024.trac-1.9,"This study introduces {``}Ice and Fire,{''} a ...","Ice and Fire: Dataset on Sentiment, Emotions, ..."
147,"Offensiveness, Hate, Emotion and {GPT}: Benchm...","Bauer, Nikolaj and\nPreisig, Moritz and\nVol...","Proceedings of the Fourth Workshop on Threat, ...",2024,https://aclanthology.org/2024.trac-1.14,"In this paper, we extend the work of benchmark...","Offensiveness, Hate, Emotion and {GPT}: Benchm..."
...,...,...,...,...,...,...,...
82287,Multi-Modal Emotion Recognition from Speech an...,"Chuang, Ze-Jing and\nWu, Chung-Hsien",International Journal of Computational Linguis...,2004,https://aclanthology.org/O04-3004,,Multi-Modal Emotion Recognition from Speech an...
82336,Detecting Emotions in {M}andarin Speech,"Pao, Tsang-Long and\nChen, Yu-Te and\nYeh, J...",Proceedings of the 16th Conference on Computat...,2004,https://aclanthology.org/O04-1038,,Detecting Emotions in {M}andarin Speech
82428,Predicting Emotion in Spoken Dialogue from Mul...,"Forbes-Riley, Kate and\nLitman, Diane",Proceedings of the Human Language Technology C...,2004,https://aclanthology.org/N04-1026,,Predicting Emotion in Spoken Dialogue from Mul...
82618,{``}You Stupid Tin Box{''} - Children Interact...,"Batliner, A. and\nHacker, C. and\nSteidl, S....",Proceedings of the Fourth International Confer...,2004,http://www.lrec-conf.org/proceedings/lrec2004/...,This paper deals with databases that combine d...,{``}You Stupid Tin Box{''} - Children Interact...


In [45]:
# Write each filtered result set to its own CSV file, leaving out the row index.
for matches, csv_name in (
    (emp_res, 'acl_empathy_related_papers.csv'),
    (emo_res, 'acl_emotion_related_papers.csv'),
):
    matches.to_csv(csv_name, index=False)