In [1]:
import pandas as pd
from pybtex.database.input import bibtex

#### Parse a BibTeX file and store it in a DataFrame

In [2]:
# Start with an empty list; it will hold one field mapping per reference.
bib_list = []

# Parse the BibTeX file with pybtex; the parsed result exposes the
# references through `bibdata.entries`.
parser = bibtex.Parser()
bibdata = parser.parse_file("aies-papers.bib")

In [3]:
# Collect the field mapping of every individual reference in the parsed file.
# The list is rebuilt from scratch (instead of appended to) so that re-running
# this cell does not duplicate references in `bib_list`.
bib_list = [bibdata.entries[bib_id].fields for bib_id in bibdata.entries]

In [4]:
# One row per reference, one column per BibTeX field found in the entries.
bib_df = pd.DataFrame(data=bib_list)

# Preview the first five rows.
bib_df.head(n=5)

Unnamed: 0,abstract,address,booktitle,doi,isbn,keywords,location,numpages,pages,publisher,series,title,url,year
0,Clinical notes are becoming an increasingly im...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534203,9781450392471,"natural language processing, clinical notes, h...","Oxford, United Kingdom",15,7–21,Association for Computing Machinery,AIES '22,Write It Like You See It: Detectable Differenc...,https://doi.org/10.1145/3514094.3534203,2022
1,Recommender system fairness has been studied f...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534173,9781450392471,"fairness, machine learning, recommender systems","Oxford, United Kingdom",14,22–35,Association for Computing Machinery,AIES '22,Long-Term Dynamics of Fairness Intervention in...,https://doi.org/10.1145/3514094.3534173,2022
2,We propose a solution for intelligent househol...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534152,9781450392471,"Garbage Management, Vehicle Routing Problem, E...","Oxford, United Kingdom",10,36–45,Association for Computing Machinery,AIES '22,Dynamic Fleet Management and Household Feedbac...,https://doi.org/10.1145/3514094.3534152,2022
3,"This paper proposes SCALES, a general framewor...","New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534190,9781450392471,"fairness, constrained reinforcement learning","Oxford, United Kingdom",10,46–55,Association for Computing Machinery,AIES '22,SCALES: From Fairness Principles to Constraine...,https://doi.org/10.1145/3514094.3534190,2022
4,With the increasing pervasiveness of algorithm...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534145,9781450392471,"anticipatory governance, broader impacts, ai e...","Oxford, United Kingdom",12,56–67,Association for Computing Machinery,AIES '22,Crowdsourcing Impacts: Exploring the Utility o...,https://doi.org/10.1145/3514094.3534145,2022


#### Keyword Search in abstract column

In [5]:
# Keywords to search for in the abstracts.
bias = ['bias', 'fairness', 'equitable']

# Join the keywords with '|' so that the pattern matches any one of them.
bias_pattern = str.join('|', bias)

# Display the resulting pattern.
bias_pattern

'bias|fairness|equitable'

#### Printing rows containing keywords

In [6]:
# Boolean mask: True where the abstract matches any keyword in `bias_pattern`.
# `na=False` treats references without an abstract as non-matching; without
# it the mask would contain NaN and `.loc` would refuse to index with it.
# Note: the match is case-sensitive (pandas default).
bias_mask = bib_df["abstract"].str.contains(bias_pattern, na=False)

# Show the first matching rows; `reset_index()` keeps the original row
# position in an `index` column.
bib_df.loc[bias_mask].reset_index().head()

Unnamed: 0,index,abstract,address,booktitle,doi,isbn,keywords,location,numpages,pages,publisher,series,title,url,year
0,0,Clinical notes are becoming an increasingly im...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534203,9781450392471,"natural language processing, clinical notes, h...","Oxford, United Kingdom",15,7–21,Association for Computing Machinery,AIES '22,Write It Like You See It: Detectable Differenc...,https://doi.org/10.1145/3514094.3534203,2022
1,1,Recommender system fairness has been studied f...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534173,9781450392471,"fairness, machine learning, recommender systems","Oxford, United Kingdom",14,22–35,Association for Computing Machinery,AIES '22,Long-Term Dynamics of Fairness Intervention in...,https://doi.org/10.1145/3514094.3534173,2022
2,3,"This paper proposes SCALES, a general framewor...","New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534190,9781450392471,"fairness, constrained reinforcement learning","Oxford, United Kingdom",10,46–55,Association for Computing Machinery,AIES '22,SCALES: From Fairness Principles to Constraine...,https://doi.org/10.1145/3514094.3534190,2022
3,6,The field of eXplainable Artificial Intelligen...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534164,9781450392471,"cognitive bias, xai., human-centered ai, expla...","Oxford, United Kingdom",14,78–91,Association for Computing Machinery,AIES '22,How Cognitive Biases Affect XAI-Assisted Decis...,https://doi.org/10.1145/3514094.3534164,2022
4,7,Artificial Intelligence startups use training ...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534195,9781450392471,"AI, scale barriers, startups, ethics, data","Oxford, United Kingdom",15,92–106,Association for Computing Machinery,AIES '22,The Cost of Ethical AI Development for AI Star...,https://doi.org/10.1145/3514094.3534195,2022


In [6]:
# Write the full reference table to an Excel workbook in the working directory.
# NOTE(review): presumably this file is the starting point for the manual
# category labelling loaded further down; confirm.
bib_df.to_excel(excel_writer="aies_bib.xlsx")

Import the spreadsheet with the manually assigned categories (`aies_bib_cat.xlsx`)

### Manually labelled categories

1. Bias and Fairness
2. Ethics
3. Policy and Governance
4. Sociology and Societal Impact
5. Explainability and Trust
6. Alignment/Machine Ethics

In [7]:
# Load the workbook that holds the reference table plus a `category` column.
bib_df_cat = pd.read_excel(io="aies_bib_cat.xlsx")

# Preview the first five rows.
bib_df_cat.head(n=5)

Unnamed: 0.1,Unnamed: 0,abstract,address,booktitle,doi,isbn,keywords,location,numpages,pages,publisher,series,title,url,year,category
0,0,Clinical notes are becoming an increasingly im...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534203,9781450392471,"natural language processing, clinical notes, h...","Oxford, United Kingdom",15,7–21,Association for Computing Machinery,AIES '22,Write It Like You See It: Detectable Differenc...,https://doi.org/10.1145/3514094.3534203,2022,bias
1,1,Recommender system fairness has been studied f...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534173,9781450392471,"fairness, machine learning, recommender systems","Oxford, United Kingdom",14,22–35,Association for Computing Machinery,AIES '22,Long-Term Dynamics of Fairness Intervention in...,https://doi.org/10.1145/3514094.3534173,2022,bias
2,2,We propose a solution for intelligent househol...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534152,9781450392471,"Garbage Management, Vehicle Routing Problem, E...","Oxford, United Kingdom",10,36–45,Association for Computing Machinery,AIES '22,Dynamic Fleet Management and Household Feedbac...,https://doi.org/10.1145/3514094.3534152,2022,ethics
3,3,"This paper proposes SCALES, a general framewor...","New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534190,9781450392471,"fairness, constrained reinforcement learning","Oxford, United Kingdom",10,46–55,Association for Computing Machinery,AIES '22,SCALES: From Fairness Principles to Constraine...,https://doi.org/10.1145/3514094.3534190,2022,bias
4,4,With the increasing pervasiveness of algorithm...,"New York, NY, USA",Proceedings of the 2022 AAAI/ACM Conference on...,10.1145/3514094.3534145,9781450392471,"anticipatory governance, broader impacts, ai e...","Oxford, United Kingdom",12,56–67,Association for Computing Machinery,AIES '22,Crowdsourcing Impacts: Exploring the Utility o...,https://doi.org/10.1145/3514094.3534145,2022,policy


Count the number of papers in each category

In [8]:
# Group the titles by their category label, then count the non-null titles
# in each group.
titles_by_category = bib_df_cat.groupby(by="category")["title"]
titles_by_category.count()

category
align      8
bias      23
ethics    16
policy    10
soc       10
xai       11
Name: title, dtype: int64

In [9]:
# Save only the `category` column (together with the row index) to a CSV file.
category_column = bib_df_cat.loc[:, "category"]
category_column.to_csv(path_or_buf="categories.csv")