## FILTERING PUBLICATIONS FOR RESEARCH WORK

In [291]:
import pandas as pd
import bibtexparser
import chardet
from collections import Counter

### Processing Papers from IEEE

In [292]:
ieee_papers = pd.read_csv("souced/IEEE_final.csv")
ieee_papers.head()

Unnamed: 0,Document Title,Authors,Author Affiliations,Publication Title,Date Added To Xplore,Publication Year,Volume,Issue,Start Page,End Page,...,Mesh_Terms,Article Citation Count,Patent Citation Count,Reference Count,License,Online Date,Issue Date,Meeting Date,Publisher,Document Identifier
0,Reliability of phantom pain relief in neuroreh...,Y. Sano; A. Ichinose; N. Wake; M. Osumi; M. Su...,"The Department of Mechano- Informatics, The Un...",2015 37th Annual International Conference of t...,5 Nov 2015,2015,,,2482,2485,...,Humans;Neurological Rehabilitation;Phantom Lim...,8.0,,18.0,IEEE,5 Nov 2015,,,IEEE,IEEE Conferences
1,Research of interactive experience display of ...,W. Zhang; Y. Zhang,"Digital Media Technology, Jiangsu University, ...",2020 International Conference on Innovation De...,30 Aug 2021,2020,,,367,372,...,,,,12.0,IEEE,30 Aug 2021,,,IEEE,IEEE Conferences
2,Investigating Spherical Fish Tank Virtual Real...,G. Hagemann; Q. Zhou; I. Stavness; S. Fels,University of British Columbia LMU Munich; Uni...,2019 IEEE Conference on Virtual Reality and 3D...,15 Aug 2019,2019,,,950,951,...,,,,14.0,IEEE,15 Aug 2019,,,IEEE,IEEE Conferences
3,Cooperative node selection scheme based on cre...,D. Hao; Y. Chen; Y. Wang,"Xijing University, Xi’an, China; Xijing Univer...",2020 International Conference on Virtual Reali...,21 Sep 2021,2020,,,780,782,...,,1.0,,6.0,IEEE,21 Sep 2021,,,IEEE,IEEE Conferences
4,Design of e-commerce logistics distribution pa...,L. Min,Shandong College of Electronic Technology China,2020 International Conference on Virtual Reali...,21 Sep 2021,2020,,,38,41,...,,,,10.0,IEEE,21 Sep 2021,,,IEEE,IEEE Conferences


In [323]:
ieee_papers.shape


(545, 33)

In [293]:
ieee_papers["Document Title"].iloc[97]

'VR-HMD Eye Tracker in Active Visual Field Testing'

### Processing Papers from scopus

In [294]:
scopus_papers = pd.read_csv("souced/Scopus_exported_refine_values1.csv")
scopus_papers.columns

Index(['YEAR', 'Unnamed: 1', 'AUTHOR NAME', 'Unnamed: 3', 'SUBJECT AREA',
       'Unnamed: 5', 'SOURCE TITLE', 'Unnamed: 7', 'KEYWORD', 'Unnamed: 9',
       'AFFILIATION', 'Unnamed: 11', 'FUNDING SPONSOR', 'Unnamed: 13',
       'COUNTRY', 'Unnamed: 15'],
      dtype='object')

In [295]:
scopus_papers["SOURCE TITLE"]

0      Proceedings Of SPIE The International Society ...
1      Proceedings Electronic Components And Technolo...
2                                            IEEE Access
3         ACM International Conference Proceeding Series
4                        Journal Of Electronic Materials
                             ...                        
155    Proceedings Of The 24th Electronics Packaging ...
156    Proceedings Of The ACM Symposium On Applied Co...
157    Proceedings Of The Annual International Confer...
158    Proceedings Of The European Safety And Reliabi...
159                                            Undefined
Name: SOURCE TITLE, Length: 160, dtype: object

In [296]:
scopus =pd.read_csv('souced/new sciencedirect/ScienceDirect_citations_1683302487066.txt', delimiter='\t', encoding='utf-8')

In [297]:
scopus.sample(10)

Unnamed: 0,"C.Y. Lee, S.P. Yang, C.H. Yang, M.K. Lu, T.T. Kuo, C.E. Ho,"
201,https://doi.org/10.1016/j.corsci.2011.09.017.
226,Keywords: In–50Sn alloy; Photovoltaic ribbon; ...
570,"Separation and Purification Technology,"
214,Abstract: This paper reviews the state-of-the-...
402,"ISSN 0304-3894,"
582,"Volume 687,"
142,"Volume 21,"
450,Keywords: Residue dating; Residue analysis; AM...
310,(https://www.sciencedirect.com/science/article...
479,"ISSN 0022-3093,"


In [298]:
# df = pd.read_csv('souced/new sciencedirect/ScienceDirect_citations_1683302487066.txt', sep='\n', header=None)

In [299]:
# widths = [1] * 10  # specify the width of each column as 1
# df = pd.read_fwf('souced/new sciencedirect/ScienceDirect_citations_1683302487066.txt', widths=widths, header=None)
# df

### Processing Papers from ACM

In [300]:
# get the encoding for tis file
with open("souced/acm_final.bib", 'rb') as f:
    result = chardet.detect(f.read())

encoding = result['encoding']
encoding

# open the file with the right encoding
with open("souced/acm_final.bib", 'r', encoding=encoding) as bibtex_file:
    bib_database = bibtexparser.load(bibtex_file)
print(bib_database)

<bibtexparser.bibdatabase.BibDatabase object at 0x0000022171BDF3A0>


In [301]:
for entry in bib_database.entries:
    #print(f"Title: {entry['title']}")
    pass

In [302]:
# Extract data from entries
data = []
for entry in bib_database.entries:
    row = {
        'author(s)': entry.get('author', ''),
        'title': entry.get('title', ''),
        'year': entry.get('year', ''),
        'isbn': entry.get('isbn', ''),
        'publisher': entry.get('publisher', ''),
        'address': entry.get('year', ''),
        'url': entry.get('url', ''),
        'doi': entry.get('doi', ''),
        'abstract': entry.get('abstract', ''),
        'booktitle': entry.get('booktitle', ''),
        'pages': entry.get('pages', ''),
        'numpages': entry.get('numpages', ''),
        'keywords': entry.get('keywords', ''),
        'location': entry.get('location', ''),
        'series': entry.get('series', '')
    }
    data.append(row)

In [303]:
acm_papers= pd.DataFrame(data)
acm_papers

Unnamed: 0,author(s),title,year,isbn,publisher,address,url,doi,abstract,booktitle,pages,numpages,keywords,location,series
0,"Sagheb, Shahabedin and Liu, Frank Wencheng and...",SWISH: A Shifting-Weight Interface of Simulate...,2019,9781450368162,Association for Computing Machinery,2019,https://doi.org/10.1145/3332165.3347870,10.1145/3332165.3347870,Current VR/AR systems are unable to reproduce ...,Proceedings of the 32nd Annual ACM Symposium o...,751‚Äì761,11,"ungrounded haptic feedback, fluid dynamics, vi...","New Orleans, LA, USA",UIST '19
1,"Zhang, Dong and Li, Wenhang and Li, Yi and Gon...",A Group Activity Analysis Method Based on Imme...,2018,9781450365192,Association for Computing Machinery,2018,https://doi.org/10.1145/3289430.3289443,10.1145/3289430.3289443,Group activity analysis is important for crowd...,Proceedings of the 2018 2nd International Conf...,110‚Äì113,4,"Emergency Management, Virtual Geographic Envir...","Beijing, China",BDIOT 2018
2,"Liang, Hui and Ge, Chao and Liang, Fei and Sun...",Training Model of Safe Escape From Fire Based ...,2020,9781450377027,Association for Computing Machinery,2020,https://doi.org/10.1145/3375998.3376013,10.1145/3375998.3376013,The popularization of virtual reality equipmen...,Proceedings of the 2019 8th International Conf...,168‚Äì175,8,"safety training, Virtual reality, disaster eva...","Luoyang, China",ICNCC '19
3,"Olade, Ilesanmi and Liang, Hai-Ning and Flemin...",Exploring the Vulnerabilities and Advantages o...,2020,9781450376945,Association for Computing Machinery,2020,https://doi.org/10.1145/3385378.3385385,10.1145/3385378.3385385,Virtual reality applications are carving out a...,Proceedings of the 2020 4th International Conf...,45‚Äì52,8,"Authentication, Security, Pattern, Virtual rea...","Sydney, NSW, Australia",ICVARS 2020
4,"Csutak, Zsolt",Virtual Universes: The Various Impacts of Cons...,2022,9781450397667,Association for Computing Machinery,2022,https://doi.org/10.1145/3551504.3551515,10.1145/3551504.3551515,The so-called post-postmodern cyber era is spe...,Proceedings of the Central and Eastern Europea...,69‚Äì72,4,"Digital technologies, Media literacy, News awa...","Budapest, Hungary",CEEeGov '22
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
995,"Hwang, Jinho and Shwartz, Larisa and Wang, Qin...",FIXME: Enhance Software Reliability with Hybri...,2021,9780738146690,IEEE Press,2021,https://doi.org/10.1109/ICSE-SEIP52600.2021.00032,10.1109/ICSE-SEIP52600.2021.00032,"With the promise of reliability in cloud, more...",Proceedings of the 43rd International Conferen...,228‚Äì237,10,"cloud, event management, event correlation, hy...","Virtual Event, Spain",ICSE-SEIP '21
996,"Moin, Ali and Nuzzo, Pierluigi and Sangiovanni...",Optimized Design of a Human Intranet Network,2017,9781450349277,Association for Computing Machinery,2017,https://doi.org/10.1145/3061639.3062296,10.1145/3061639.3062296,We address the design space exploration of wir...,Proceedings of the 54th Annual Design Automati...,,6,,"Austin, TX, USA",DAC '17
997,"Mao, Zhijie and Wu, Guangen and Zhou, Lin",A 6G Oriented High-Throughput Satellite Commun...,2021,9781450389853,Association for Computing Machinery,2021,https://doi.org/10.1145/3487075.3487140,10.1145/3487075.3487140,The integration of satellite communication sys...,Proceedings of the 5th International Conferenc...,,5,"MAPSK, 6G wireless communication, Bit error ra...","Sanya, China",CSAE '21
998,"Shin, Hocheol and Noh, Juhwan and Kim, Dohyun ...",The System That Cried Wolf: Sensor Security An...,2020,,Association for Computing Machinery,2020,https://doi.org/10.1145/3393926,10.1145/3393926,Fire alarm and signaling systems are a network...,,,32,"fire alarm and signaling system, sensing and a...",,


#### Access and clean the data

In [304]:
acm_papers["pages"]

0      751‚Äì761
1      110‚Äì113
2      168‚Äì175
3        45‚Äì52
4        69‚Äì72
         ...    
995    228‚Äì237
996             
997             
998             
999             
Name: pages, Length: 1000, dtype: object

In [305]:
acm_papers['pages'] = acm_papers['pages'].str.replace('‚Äì', '-')

In [306]:
acm_papers["pages"]

0      751-761
1      110-113
2      168-175
3        45-52
4        69-72
        ...   
995    228-237
996           
997           
998           
999           
Name: pages, Length: 1000, dtype: object

In [307]:
# save to csv

acm_papers.to_csv("souced/acm_papers.csv")

### Processing papers from science direct

In [308]:
# # Open the text file and read the contents
# with open('souced/new sciencedirect/ScienceDirect_citations.txt', 'r', encoding='utf-8') as file:
#     lines = file.readlines()

# books = []
# current_book = {}

# # Iterate over the lines in the file
# for line in lines:
#     # Check if the line contains author names
#     if ',' in line:
#         if 'Author Names' in current_book:
#             books.append(current_book)
#             current_book = {}
#         authors = line.strip()
#         # Check if author names span multiple lines
#         while not authors.endswith(','):
#             line = next(lines)
#             authors += ' ' + line.strip()
#         current_book['Author Names'] = authors
    
#     # Check if the line contains the title of the book
#     elif ':' in line and 'Abstract' not in line and 'Keywords' not in line:
#         title = line.split(':')[1].strip()
#         # Check if title spans multiple lines
#         while not title.endswith('.'):
#             line = next(lines)
#             title += ' ' + line.strip()
#         current_book['Title'] = title
    
#     # Check if the line contains the year the book was written
#     elif ',' in line and len(line.strip().split()) == 2:
#         year = line.strip().split()[0]
#         current_book['Year'] = year
    
#     # Check if the line contains the abstract
#     elif line.startswith('Abstract:'):
#         abstract = ''
#         # Append lines to the abstract until we reach the keywords
#         while not line.startswith('Keywords:'):
#             line = next(lines)
#             abstract += line.strip() + ' '
#         current_book['Abstract'] = abstract.strip()
    
#     # Check if the line contains the keywords
#     elif line.startswith('Keywords:'):
#         keywords = line.split(':')[1].strip()
#         current_book['Keywords'] = keywords

# # Append the last book to the list
# if current_book:
#     books.append(current_book)

# # Create a Pandas DataFrame from the list of books
# df = pd.DataFrame(books)

# # Write the data to a CSV file
# df.to_csv('book_descriptions.csv', index=False)


### Filtering Papers 

In [309]:
'''
Create a search function that computes percentage occurence of keywords in the title/abstract.
We extract document with occurence level that is passed as an argument into the function.
'''
search_keywords = ['trustworthiness', 'reliability', 'mixed', 'virtual', 'reality', 'credibility', 'immersion']
def filter_papers(document, keywords, column, acceptance_rate):
    document["occurence"]= 0
    document["keywords"] = None
    document["key_words_count"]= 0
    percent = []
    count = []
    for index in range(len(document)):
        #doc = document[index].lower()
        words_in_title = document[column].iloc[index].lower().replace(",", " ").split(" ")
        keywords_found = []
        for word in keywords:
            if word in words_in_title:
                keywords_found.append(word)
        keyword_unique = set(keywords_found)
        percent_occurrence = round((len(keyword_unique) / len(keywords)) * 100)
        percent.append(percent_occurrence)
        cnt = len(keyword_unique)
        count.append(cnt)
        document.at[index, 'occurence'] = percent_occurrence
        document.at[index, 'keywords'] = keyword_unique
        document.at[index, 'key_words_count'] = int(cnt)
    
    document = document.sort_values('occurence', ascending=False)

    
    # select documents more 20% occurence level
    selected_docs = document[document["occurence"] > acceptance_rate]
    
    return selected_docs
    

### Filtering the IEEE papers with an acceptance occurence rate of 20%

In [310]:
ieee_papers_title_filters = filter_papers(ieee_papers, search_keywords, "Document Title", 20)


In [311]:
ieee_papers_title_filters.to_csv("title_only.csv")

In [312]:
ieee_papers_title_filters["Document Title"]

5     The Effect of Virtual Humans Making Verbal Com...
0     Reliability of phantom pain relief in neuroreh...
62    A Basic Psychophysics Study of Sound Reliabili...
33    On the Reliability of Wireless Virtual Reality...
34    Virtual Reality based test batteries for evalu...
                            ...                        
4     Design of e-commerce logistics distribution pa...
25    Utilizing Virtual Reality to Enhance the Digit...
6     The Effects of a Stressful Physical Environmen...
53    Interaction techniques using head gaze for vir...
52    Correction Method of Key Movements in Basketba...
Name: Document Title, Length: 102, dtype: object

In [313]:
ieee_papers_title_filters["Document Title"].iloc[97]

'Design of e-commerce logistics distribution path display system based on virtual reality technology'

#### Filtering Based on the Abstract, with acceptance occurence rate of more than 40%.
<br>
To perform the advanced filtering on the the selected titles based on the IEEE title filtering, we used those papers selected and filtered based on the abstract.

In [314]:
ieee_papers_title_filters.columns

Index(['Document Title', 'Authors', 'Author Affiliations', 'Publication Title',
       'Date Added To Xplore', 'Publication Year', 'Volume', 'Issue',
       'Start Page', 'End Page', 'Abstract', 'ISSN', 'ISBNs', 'DOI',
       'Funding Information', 'PDF Link', 'Author Keywords', 'IEEE Terms',
       'INSPEC Controlled Terms', 'INSPEC Non-Controlled Terms', 'Mesh_Terms',
       'Article Citation Count', 'Patent Citation Count', 'Reference Count',
       'License', 'Online Date', 'Issue Date', 'Meeting Date', 'Publisher',
       'Document Identifier', 'occurence', 'keywords', 'key_words_count'],
      dtype='object')

In [325]:
ieee_papers_title=pd.read_csv("title_only.csv")
ieee_papers_title.sample(10)

Unnamed: 0.1,Unnamed: 0,Document Title,Authors,Author Affiliations,Publication Title,Date Added To Xplore,Publication Year,Volume,Issue,Start Page,...,Reference Count,License,Online Date,Issue Date,Meeting Date,Publisher,Document Identifier,occurence,keywords,key_words_count
34,375,Situation display system of USV auxiliary navi...,L. Zhang; Y. Zhao; Y. Fan,"College of Marine Electrical Engineering, Dali...",2022 7th International Conference on Automatio...,25 Jul 2022,2022,,,245,...,12.0,IEEE,25 Jul 2022,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2
20,89,Correction Method of Basketball Shooting Error...,W. Yang; H. Yi,"Nan Chang Business College of Jxau, Gongqing C...",2022 Global Reliability and Prognostics and He...,14 Nov 2022,2022,,,1,...,15.0,IEEE,14 Nov 2022,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2
55,140,Monitoring virtual metrology reliability in a ...,D. Kurz; C. De Luca; J. Pilz,Alpen-Adria University (AAU) of Klagenfurt Inf...,2013 IEEE International Conference on Automati...,7 Nov 2013,2013,,,20,...,6.0,IEEE,7 Nov 2013,,,IEEE,IEEE Conferences,29,"{'reliability', 'virtual'}",2
7,103,Application of Internet of Things and Virtual ...,Y. Ding; Y. Li; L. Cheng,"Department of Physical Education, Northwest Un...",IEEE Access,2 Jun 2020,2020,8.0,,96065,...,30.0,CCBY,11 May 2020,,,IEEE,IEEE Journals,29,"{'virtual', 'reality'}",2
90,21,A maintenance influencing factor evaluation me...,C. Dai; S. Wu; Q. Tang; S. Liu; B. Liu,"Quality and Reliability Center, CSSC China Ins...","12th International Conference on Quality, Reli...",28 Apr 2023,2022,2022.0,,1920,...,,,28 Apr 2023,,,IET,IET Conferences,29,"{'virtual', 'reality'}",2
101,52,Correction Method of Key Movements in Basketba...,Y. Huang; W. Yang,"Nan Chang Business, College of Jxau, Gongqingc...",2022 Global Reliability and Prognostics and He...,14 Nov 2022,2022,,,1,...,15.0,IEEE,14 Nov 2022,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2
52,143,Touching The Droid: Understanding and Improvin...,F. Zhu; Z. Lyu; M. Sousa; T. Grossman,"Department of Computer Science, University of ...",2022 IEEE International Symposium on Mixed and...,27 Dec 2022,2022,,,807,...,52.0,IEEE,27 Dec 2022,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2
63,27,Virtual Reality Experience in Tourism: A Facto...,L. Kusdibyo; A. Brien; R. Sutrisno; D. Suhartanto,"Politeknik Negeri Bandung,Department of Busine...",2021 IEEE International Conference on Industry...,17 Sep 2021,2021,,,27,...,29.0,IEEE,17 Sep 2021,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2
54,141,Building Trust in Autonomous Vehicles: Role of...,L. Morra; F. Lamberti; F. G. Pratticó; S. L. R...,"Dipartimento di Automatica e Informatica, Poli...",IEEE Transactions on Vehicular Technology,21 Oct 2019,2019,68.0,10.0,9438,...,55.0,IEEE,6 Aug 2019,,,IEEE,IEEE Journals,29,"{'virtual', 'reality'}",2
79,39,The Difference in Measuring Reachability Dista...,W. Xiong; X. Yu; Y. -C. Lee,"School of Design, South China University of Te...",2020 IEEE 7th International Conference on Indu...,27 May 2020,2020,,,390,...,16.0,IEEE,27 May 2020,,,IEEE,IEEE Conferences,29,"{'virtual', 'reality'}",2


In [317]:
ieee_selected = ieee_papers_title_filters
advanced_ieee_filter= filter_papers(ieee_papers_title, search_keywords, 'Abstract', 40)

In [324]:
advanced_ieee_filter.head()

Unnamed: 0.1,Unnamed: 0,Document Title,Authors,Author Affiliations,Publication Title,Date Added To Xplore,Publication Year,Volume,Issue,Start Page,...,Reference Count,License,Online Date,Issue Date,Meeting Date,Publisher,Document Identifier,occurence,keywords,key_words_count
0,5,The Effect of Virtual Humans Making Verbal Com...,J. Stuart; K. Aul; M. D. Bumbach; A. Stephen; ...,University of Florida; University of Florida; ...,2022 IEEE Conference on Virtual Reality and 3D...,20 Apr 2022,2022,,,455,...,33.0,IEEE,20 Apr 2022,,,IEEE,IEEE Conferences,86,"{trustworthiness, reliability, credibility, mi...",6
76,42,Towards Artificial Intelligence Driven Immersi...,S. Alsaleh; A. Tepljakov; M. Tamre; E. Petlenkov,Department of Electrical Power Engineering and...,2021 44th International Conference on Telecomm...,30 Aug 2021,2021,,,340,...,16.0,IEEE,30 Aug 2021,,,IEEE,IEEE Conferences,57,"{immersion, virtual, reality, credibility}",4
12,112,Measurements of live actor motion in mixed rea...,G. Hough; I. Williams; C. Athwal,"Faculty of Technology, Engineering and the Env...",2014 IEEE International Symposium on Mixed and...,6 Nov 2014,2014,,,99,...,,IEEE,6 Nov 2014,,,IEEE,IEEE Conferences,57,"{mixed, virtual, reality, credibility}",4
43,184,Evaluation of the potential impact of fully-im...,A. Maffei; M. Onori,"Department of Production Engineering, KTH Roya...",2019 IEEE AFRICON,7 Jul 2020,2019,,,1,...,18.0,IEEE,7 Jul 2020,,,IEEE,IEEE Conferences,57,"{reliability, immersion, virtual, reality}",4
48,168,A Framework of Student's Learning Motivation i...,K. Cheng; A. M. Zaini; D. C. d. Wong; H. Chong...,"De Institute of Creative Arts and Design, UCSI...",2022 10th International Conference on Informat...,21 Oct 2022,2022,,,70,...,36.0,IEEE,21 Oct 2022,,,IEEE,IEEE Conferences,57,"{reliability, virtual, reality, credibility}",4


In [319]:
advanced_ieee_filter["Document Title"].iloc[50]

'Design and application of intelligent patrol system based on virtual reality'

#### Save the papers after the advanced the search


In [322]:
advanced_ieee_filter.to_csv("filtered_papers/final_ieee_papers.csv", index=False)

### Filtering the ACM papers with an acceptance occurence rate of 20%

In [327]:
acm_papers.sample(5)

Unnamed: 0,author(s),title,year,isbn,publisher,address,url,doi,abstract,booktitle,pages,numpages,keywords,location,series
183,"Stojmenovi\'{c}, Milica and Spero, Eric and St...",What is Beautiful is Secure,2022,,Association for Computing Machinery,2022,https://doi.org/10.1145/3533047,10.1145/3533047,Visual appeal has been shown to influence perc...,,,30,"Aesthetics, web certificates, visual appeal, h...",,
319,"Nisiotis, Louis and Kleanthous, Styliani",The Relationship Between Students' Engagement ...,2019,9781450368957.0,Association for Computing Machinery,2019,https://doi.org/10.1145/3304221.3319743,10.1145/3304221.3319743,The use of educational Multi-User Virtual Envi...,Proceedings of the 2019 ACM Conference on Inno...,71-77,7,"virtual worlds, engagement, transactive memory...","Aberdeen, Scotland Uk",ITiCSE '19
489,"Chowdhury, Abishi and Tripathi, Priyanka",A Novel Attempt towards Effective Scheduling B...,2014,9781450332163.0,Association for Computing Machinery,2014,https://doi.org/10.1145/2677855.2677891,10.1145/2677855.2677891,Cloud computing is now becoming a trend of mod...,Proceedings of the 2014 International Conferen...,,6,"Virtual Machine, Reliability, Priority, Datace...","Udaipur, Rajasthan, India",ICTCS '14
486,"Liu, Shudong and Li, Xiaoli and Xiang, Shili a...",Mobile Robot Routing with Energy Consumption O...,2020,9781450372350.0,Association for Computing Machinery,2020,https://doi.org/10.1145/3373724.3373739,10.1145/3373724.3373739,We consider scheduling mobile robots which are...,Proceedings of the 5th International Conferenc...,30-35,6,"Industrial internet of things, Intelligent man...","Singapore, Singapore",ICRAI '19
399,"White, Ryen W. and Hassan, Ahmed",Content Bias in Online Health Search,2014,,Association for Computing Machinery,2014,https://doi.org/10.1145/2663355,10.1145/2663355,Search engines help people answer consequentia...,,,33,"health search, Content biases",,


In [328]:
acm_papers.columns

Index(['author(s)', 'title', 'year', 'isbn', 'publisher', 'address', 'url',
       'doi', 'abstract', 'booktitle', 'pages', 'numpages', 'keywords',
       'location', 'series'],
      dtype='object')

In [329]:
acm_papers_title_filters = filter_papers(acm_papers, search_keywords, "title", 20)


In [333]:
acm_papers_title_filters.tail()

Unnamed: 0,author(s),title,year,isbn,publisher,address,url,doi,abstract,booktitle,pages,numpages,keywords,location,series,occurence,key_words_count
65,"Gomez-Rodriguez, Manuel",Distilling Information Reliability and Source ...,2017,9781450349147.0,International World Wide Web Conferences Steer...,2017,https://doi.org/10.1145/3041021.3054760,10.1145/3041021.3054760,Online knowledge repositories typically rely o...,Proceedings of the 26th International Conferen...,1513,1,"{reliability, trustworthiness}","Perth, Australia",WWW '17 Companion,29,2
66,"Tabibian, Behzad and Valera, Isabel and Farajt...",Distilling Information Reliability and Source ...,2017,9781450349130.0,International World Wide Web Conferences Steer...,2017,https://doi.org/10.1145/3038912.3052672,10.1145/3038912.3052672,Online knowledge repositories typically rely o...,Proceedings of the 26th International Conferen...,847-855,9,"{reliability, trustworthiness}","Perth, Australia",WWW '17,29,2
5,"Clark, Andrew and Pillay, Anban W. and Moodley...",A System for Pose Analysis and Selection in Vi...,2020,9781450388474.0,Association for Computing Machinery,2020,https://doi.org/10.1145/3410886.3410909,10.1145/3410886.3410909,Depth cameras provide a natural and intuitive ...,Conference of the South African Institute of C...,210-216,7,"{virtual, reality}","Cape Town, South Africa",SAICSIT '20,29,2
212,"Kawahara, Ayumu and Noguchi, Yohei and Tanaka,...",A Virtual Agent That is Equipped With Internal...,2022,,IEEE Press,2022,,,"When interacting with humans, virtual agents u...",Proceedings of the 2022 ACM/IEEE International...,844-846,3,"{virtual, credibility}","Sapporo, Hokkaido, Japan",HRI '22,29,2
960,"Cipresso, Pietro and Serino, Silvia and Pedrol...",Psychometric Reliability of the NeuroVR-Based ...,2013,9781936968800.0,"ICST (Institute for Computer Sciences, Social-...",2013,https://doi.org/10.4108/icst.pervasivehealth.2...,10.4108/icst.pervasivehealth.2013.252361,This stusdy aim at testing the psychometric re...,Proceedings of the 7th International Conferenc...,446-449,4,"{reliability, virtual}","Venice, Italy",PervasiveHealth '13,29,2


In [332]:
acm_papers_title_filters.shape

(24, 17)

In [334]:
acm_papers_title_filters.to_csv("acm_title_filters_result.csv")

#### Filtering Based on the Abstract, with acceptance occurence rate of more than 40%.

In [335]:
#load the acm title results that was saved
acm_title_results=pd.read_csv("acm_title_filters_result.csv")

In [338]:
acm_title_results.sample(5)

Unnamed: 0.1,Unnamed: 0,author(s),title,year,isbn,publisher,address,url,doi,abstract,booktitle,pages,numpages,keywords,location,series,occurence,key_words_count
7,687,"Pellegrini, Andrea and Greathouse, Joseph L. a...",Viper: Virtual Pipelines for Enhanced Reliability,2012,9781450000000.0,IEEE Computer Society,2012,,,The reliability of future processors is threat...,Proceedings of the 39th Annual International S...,344-355,12,"{'reliability', 'virtual'}","Portland, Oregon",ISCA '12,29,2
5,38,"Sendhilnathan, Naveen and Zhang, Ting and Lafr...",Detecting Input Recognition Errors and User Er...,2022,9781450000000.0,Association for Computing Machinery,2022,https://doi.org/10.1145/3526113.3545628,10.1145/3526113.3545628,Gesture-based recognition systems are suscepti...,Proceedings of the 35th Annual ACM Symposium o...,,19,"{'virtual', 'reality'}","Bend, OR, USA",UIST '22,29,2
1,22,"Suhonen, Katja and V\""{a}\""{a}n\""{a}nen-Vainio...",Two User Studies on Creation and Evaluation of...,2012,9781450000000.0,Association for Computing Machinery,2012,https://doi.org/10.1145/2254556.2254665,10.1145/2254556.2254665,Mixed reality (MR) technologies and applicatio...,Proceedings of the International Working Confe...,588-595,8,"{'mixed', 'reality'}","Capri Island, Italy",AVI '12,29,2
19,65,"Gomez-Rodriguez, Manuel",Distilling Information Reliability and Source ...,2017,9781450000000.0,International World Wide Web Conferences Steer...,2017,https://doi.org/10.1145/3041021.3054760,10.1145/3041021.3054760,Online knowledge repositories typically rely o...,Proceedings of the 26th International Conferen...,1513,1,"{'reliability', 'trustworthiness'}","Perth, Australia",WWW '17 Companion,29,2
0,13,"Houzangbe, Samory and Christmann, Olivier and ...",Integrability and Reliability of Smart Wearabl...,2018,9781450000000.0,Association for Computing Machinery,2018,https://doi.org/10.1145/3234253.3234305,10.1145/3234253.3234305,Virtual Reality (VR) is now an affordable tech...,Proceedings of the Virtual Reality Internation...,,6,"{'reliability', 'virtual', 'reality'}","Laval, France",VRIC '18,43,3


In [342]:
#filter on the abstract column
abstract_acm_filter= filter_papers(acm_title_results, search_keywords, 'abstract', 40)

In [344]:
abstract_acm_filter

Unnamed: 0.1,Unnamed: 0,author(s),title,year,isbn,publisher,address,url,doi,abstract,booktitle,pages,numpages,keywords,location,series,occurence,key_words_count
3,42,"Chakareski, Jacob and Khan, Mahmudur",Wifi-VLC Dual Connectivity Streaming System fo...,2021,9781450000000.0,Association for Computing Machinery,2021,https://doi.org/10.1145/3458306.3460999,10.1145/3458306.3460999,We investigate a future WiFi-VLC dual connecti...,Proceedings of the 31st ACM Workshop on Networ...,106-113,8,"{reliability, virtual, reality}","Istanbul, Turkey",NOSSDAV '21,43,3
4,40,"Zhang, Ting and Hu, Zhenhong and Gupta, Aakar ...",RIDS: Implicit Detection of a Selection Gestur...,2022,9781450000000.0,Association for Computing Machinery,2022,https://doi.org/10.1145/3526113.3545701,10.1145/3526113.3545701,Freehand interactions with augmented and virtu...,Proceedings of the 35th Annual ACM Symposium o...,,12,"{reliability, virtual, reality}","Bend, OR, USA",UIST '22,43,3
1,22,"Suhonen, Katja and V\""{a}\""{a}n\""{a}nen-Vainio...",Two User Studies on Creation and Evaluation of...,2012,9781450000000.0,Association for Computing Machinery,2012,https://doi.org/10.1145/2254556.2254665,10.1145/2254556.2254665,Mixed reality (MR) technologies and applicatio...,Proceedings of the International Working Confe...,588-595,8,"{reliability, mixed, reality}","Capri Island, Italy",AVI '12,43,3


In [345]:
abstract_acm_filter.to_csv("filtered_papers/final_acm_papers.csv", index=False)