## Research Papers: Filtering

In [1]:
import pandas as pd


In [2]:
all_papers = pd.read_csv("Combined Papers.csv")
all_papers.sample(5)

Unnamed: 0,Title,Authors,DOI,URLs,Notes,Abstract
794,Podcasting in nursing and midwifery education:...,"O'Connor, S; Daly, CS; MacArthur, J; Borglin, ...",10.1016/j.nepr.2020.102827,http://dx.doi.org/10.1016/j.nepr.2020.102827,,Podcasting is used in higher education so vari...
1084,The use of gaze to control drones,"Hansen J.P., Alapetite A., MacKenzie I.S., Møl...",10.1145/2578153.2578156,https://www.scopus.com/inward/record.uri?eid=2...,,This paper presents an experimental investigat...
968,Empowerment and embodiment for collaborative m...,"Pan Y,Sinclair D,Mitchell K",10.1002/cav.1838,https://onlinelibrary.wiley.com/doi/abs/10.100...,e1838 cav.1838,Abstract We present several mixed-reality-base...
1045,Aligning the real and the virtual world: Mixed...,"Radanovic M,Khoshelham K,Fraser C",10.1016/j.aei.2023.101960,https://www.sciencedirect.com/science/article/...,,Existing camera localisation methods for indoo...
1424,Process characterization and evaluation of NC ...,"Minoufekr M., Schug P., Joshi M.",10.5220/0005054606610670,https://www.scopus.com/inward/record.uri?eid=2...,,"With a view to achieve stable production, nowa..."


In [3]:
all_papers.shape

(1435, 6)

#### Remove Duplicates

In [4]:
all_papers.drop_duplicates(subset='Title', inplace=True)  # Remove duplicate titles

In [5]:
all_papers.shape

(1234, 6)

In [6]:
all_papers.columns

Index(['Title', 'Authors', 'DOI', 'URLs', 'Notes', 'Abstract'], dtype='object')

### Filter out papers 

#### Title Filtering

In [27]:
"""
We choose two sets of keywords: Any two combination of these keywords makes the paper relevant 
for this research work
"""
title_keywords1 = ["virtual reality", "virtual environment", "immersive technology", "immersion", "augmented reality"]

title_keywords2 = ["reliability", "credibility", "trustworthiness", "trust", "presence", "user experience", "believability"]

In [28]:
"""
A method that filters the papers based on keyword presence in the title"""
def filter_title(title):
    title_lower = title.lower()
    return any(word in title_lower for word in title_keywords1) and \
           any(word in title_lower for word in title_keywords1)


In [29]:
# Apply the method
filtered_title = all_papers[all_papers['Title'].astype(str).apply(filter_title)]

filtered_title

Unnamed: 0,Title,Authors,DOI,URLs,Notes,Abstract
1,Scaffolding Spatial Ability with Augmented Rea...,"Wong J,Yu K,Giacaman N",10.1504/ijmlo.2021.111597,https://doi.org/10.1504/ijmlo.2021.111597;http...,,Spatial ability is believed to aid comprehensi...
2,Augmented and Virtual Reality-Driven Intervent...,"Paul Odenigbo I,AlSlaity A,Orji R",10.1145/3505284.3529964,https://doi.org/10.1145/3505284.3529964;http:/...,,Augmented Reality (AR) and Virtual Reality (VR...
5,Digital Learning Environments - Constructing A...,"Somerkoski B,Oliva D,Tarkkanen K,Luimula M",10.1145/3377571.3377615,https://doi.org/10.1145/3377571.3377615;http:/...,,This article gives examples of how the use of ...
10,CryptoAR Wallet: A Blockchain Cryptocurrency W...,"Chen YP,Ko JC",10.1145/3338286.3344386,https://doi.org/10.1145/3338286.3344386;http:/...,,Blockchain technology has recently become popu...
13,Nonverbal Behavior of Interviewers Influences ...,"Wyssenbach T,Zeballos M,Loosli S,Schwaninger A",10.1007/s10055-021-00540-3,https://doi.org/10.1007/s10055-021-00540-3;htt...,,This study examined whether an interviewer’s n...
...,...,...,...,...,...,...
1406,Edge computing enabled mobile augmented realit...,"Liu J., Zhang Q.",,https://www.scopus.com/inward/record.uri?eid=2...,,Mobile edge computing (MEC) is one of the prom...
1413,pp. 251-265; Saggio G. & Ferrari M. (2012)-Ne...,eas (2013) Natural Hazards,Papa,M.N.,J.,Dam-break flows of dry granular materials on ...
1423,Incorporating augmented reality into learning ...,"Hsu Y.-S., Lin Y.-H., Yang B., Yang S.-F., Cha...",,https://www.scopus.com/inward/record.uri?eid=2...,,"In this paper, we demonstrate how to incorpora..."
1433,Research into the method for construction of i...,"Deng J., Zheng X.",10.1117/12.872843,https://www.scopus.com/inward/record.uri?eid=2...,,"Nowadays, the development of Digital Earth has..."


In [30]:
filtered_title.shape

(539, 6)

#### Abstract filtering

In [88]:
# Apply filtering conditions
#filtered_abstract = all_papers[all_papers["Abstract"].astype(str).apply(lambda x: sum(keyword.lower() in x.lower() for keyword in keywords) >= 3)]

In [24]:
abstract_keywords1 = ["virtual reality", "virtual environment", "immersive technology", "immersion", "augmented reality"]
abstract_keywords2 = ["reliability", "credibility", "trust", "trustworthy", "believability", "believable"]
abstract_keywords3 = ["presence","user experience", "user perception", "usability"]

In [18]:
def filter_abstract(abstract):
    abstract_lower = abstract.lower()
    return any(word in abstract_lower for word in abstract_keywords1) and \
           any(word in abstract_lower for word in abstract_keywords2) and \
           any(word in abstract_lower for word in abstract_keywords3)

In [31]:
filtered_data = filtered_title[filtered_title['Abstract'].astype(str).apply(filter_abstract)]

# Print the filtered DataFrame
filtered_data["Title"].head()

10    CryptoAR Wallet: A Blockchain Cryptocurrency W...
16    How Should Automated Vehicles Interact with Pe...
18    A Fluid Human Interactive Proof in Virtual Env...
24    AI-Assisted Affective Computing and Spatial Au...
25    "You Better Eat to Survive": Exploring Coopera...
Name: Title, dtype: object

In [32]:
filtered_data.shape

(91, 6)

In [33]:
filtered_data.to_csv("output1.csv")