## Arxiv Paper Dataframe by Crawling

<br>

In [None]:
%pip install arxiv
%pip install clipboard
%pip install pyautogui

In [1]:
import re
import tqdm
import arxiv
import clipboard
import pyautogui
import pandas as pd
import numpy as np
from datetime import datetime
from datetime import timedelta

In [4]:
def make_arxiv_paper_df_with_abstract(paper_ids):

    arxiv_paper_df_with_abstract = pd.DataFrame({'Title':['Noun'],
                               'Journal/Conference':['Noun'],
                               'Date':['Noun'], 
                               'Author':['Noun'],
                               'Link':['Noun'],
                               'Abstract':['Noun']})
    client = arxiv.Client()
    
    pbar = tqdm.tqdm(paper_ids)

    for idx, paper_id in enumerate(pbar):
        search = arxiv.Search(id_list=[paper_id])
        paper = next(client.results(search))
        
        paper_journal_conf = re.search(r'[A-Z ]+[0-9]+[0-9]+[0-9]+[0-9]', str(paper.comment))
        if paper_journal_conf != None:
            paper_journal_conf = paper_journal_conf.group().strip()
            if len(paper_journal_conf) > 4:
                if paper_journal_conf[-4] != " ":
                    paper_journal_conf = paper_journal_conf[:-4] + " " + paper_journal_conf[-4:]
                else:
                    paper_journal_conf = paper_journal_conf
            elif len(paper_journal_conf) <= 4:
                paper_journal_conf = ""
        elif paper_journal_conf == None:
            paper_journal_conf = ""

        arxiv_paper_df_with_abstract.loc[idx] = [paper.title, 
                                paper_journal_conf,
                                paper.published.date(), 
                                str(paper.authors[0]) + ' et al',
                                    paper.entry_id,
                                    paper.summary]
    pbar.close()
    
    arxiv_paper_df_with_abstract = pd.DataFrame(arxiv_paper_df_with_abstract.sort_values(by='Date').reset_index()).drop(['index'], axis='columns')
    arxiv_paper_df_with_abstract.index = np.arange(1, len(arxiv_paper_df_with_abstract) + 1)         
    
    return arxiv_paper_df_with_abstract

In [5]:
def str_convert_datetime(date):
    return datetime.strptime(date, '%Y-%m-%d').date()

In [6]:
def add_other_papers_column(arxiv_paper_df_with_abstract, other_papers):
  
  df_length = len(arxiv_paper_df_with_abstract) - 1

  pbar = tqdm.tqdm(other_papers)

  for other_paper in pbar:
    df_length += 1
    arxiv_paper_df_with_abstract.loc[df_length] = other_paper
  
  arxiv_paper_df_with_abstract = pd.DataFrame(arxiv_paper_df_with_abstract.sort_values(by='Date').reset_index()).drop(['index'], axis='columns')
  arxiv_paper_df_with_abstract.index = np.arange(1, len(arxiv_paper_df_with_abstract) + 1)  
  
  pbar.close()
  
  return arxiv_paper_df_with_abstract

In [7]:
def hyperlink(x):
    hyperlink= '[Link]' + '(' + x + ')'
    return hyperlink

In [8]:
def input_jouranl_conference_theme(arxiv_paper_df_with_abstract):

    paper_title = arxiv_paper_df_with_abstract['Title']
    paper_journal_conference = arxiv_paper_df_with_abstract['Journal/Conference']
    arxiv_paper_df_with_abstract['Theme'] = ""
    paper_theme = arxiv_paper_df_with_abstract['Theme']

    pyautogui.alert('Input Paper Jouranl Conference')

    for index, (title, journal_conference) in enumerate(zip(paper_title, paper_journal_conference)):

        if len(journal_conference) < 2:
            clipboard.copy(title)
            input_journal_conference = input("{} For {}: ".format("Input Journal & Conference", title)) 
            arxiv_paper_df_with_abstract.loc[index, 'Journal/Conference'] = input_journal_conference

    pyautogui.alert('Input Paper Title')

    for index, (title, theme) in enumerate(zip(paper_title, paper_theme)):

        if len(theme) < 2:
            clipboard.copy(title)
            input_theme = input("{} For {}: ".format("Input Theme", title)) 
            arxiv_paper_df_with_abstract.loc[index, 'Theme'] = input_theme

    arxiv_paper_df_with_abstract = arxiv_paper_df_with_abstract[['Title', 'Journal/Conference', 'Date', 'Author', 'Theme', 'Link', 'Abstract']]

    return arxiv_paper_df_with_abstract

In [9]:
def make_arxiv_paper_df_with_abstract_by_theme(theme_order, arxiv_paper_df_with_abstract):

    def sorter(column):
        mapper = {name: order for order, name in enumerate(theme_order)}
        return column.map(mapper)

    arxiv_paper_df_with_abstract_by_theme = arxiv_paper_df_with_abstract.sort_values(by=['Theme', 'Date'], key=sorter, ascending=True).reset_index() 
    del arxiv_paper_df_with_abstract_by_theme['index']
    arxiv_paper_df_with_abstract_by_theme.index += 1 
    arxiv_paper_df_with_abstract_by_theme = arxiv_paper_df_with_abstract_by_theme.set_index('Theme', append=True).swaplevel(0, 1)

    return arxiv_paper_df_with_abstract_by_theme

In [11]:
def make_arxiv_paper_df(arxiv_paper_df_with_abstract):

    arxiv_paper_df_with_abstract = pd.DataFrame(arxiv_paper_df_with_abstract.sort_values(by='Date').reset_index()).drop(['index'], axis='columns')
    arxiv_paper_df_with_abstract.index = np.arange(1, len(arxiv_paper_df_with_abstract) + 1)    
    arxiv_paper_df = arxiv_paper_df_with_abstract.drop(['Abstract'], axis='columns')

    return arxiv_paper_df

In [12]:
def make_arxiv_paper_df_by_theme(arxiv_paper_df_with_abstract_by_theme):
  
    arxiv_paper_df_by_theme = arxiv_paper_df_with_abstract_by_theme.drop(['Abstract'], axis='columns')

    return arxiv_paper_df_by_theme

In [12]:
paper_ids = ["1409.0473v7", "1409.3215v3", "1706.03762v5", "1609.08144v2",
             "1508.07909v5", "1301.3781v3", "1808.06226v1", "1802.05365v2",
             "1810.04805v2", "2104.02395v3", "2202.07105v2", "1503.02531v1",
             "1910.01108v4", "1908.09355v1", "2008.05030v4", "1603.08983v6",
             "1709.01686v1", "1804.07461v3", "1902.03393v2", "2004.02178v2",
             "2002.10957v2", "2012.15828v2", "1707.07328v1", "1612.00796v2",
             "1806.00451v1", "2106.04570v3", "1703.03400v3", "1604.00289v3",
             "2004.09602v1", "1603.01025v2", "1308.3432v1", "1909.05840v2",
             "1712.05877v1", "1811.08886v3", "1502.03044v3", "1907.05686v5", 
             "2203.06390v1", "1609.07061v1", "1911.09464v2", "2103.13630v3",
             "1603.05279v4", "1906.05714v1", "1905.03197v3", "1907.10529v3",
             "1910.13461v1", "2007.10760v3", "2008.00312", "1803.06535",
             "1705.09655", "1312.6114", "1606.03657", "2103.04264",
             "1902.06531", "2004.06660", "1908.10084", "1905.10447",
             "2006.01043", "1408.5882", "2301.10602", "1810.10191",
             "1509.02971", "1802.09464", "2109.11234", "1707.06347",
             "2006.01043", "1408.5882", "2301.10602", "1810.10191",
             "1710.02298", "1312.5602", "1712.00378", "2210.03992",
             "2305.17416", "1705.00106", "1806.03822", "1910.10683",
             "2109.01652", "2210.03992", "2212.10560", "2302.13971",
             "1909.06951", "1705.00106", "1806.03822", "1910.10683",
             "2109.01652", "2210.03992", "2212.10560", "2302.13971",
             "2304.03277", "2305.11206", "2305.14314", "2305.14152",
             "2204.07705", "2305.17002", "2302.02210", "2203.11086",
             "2010.11929", "2012.12877", "1606.06160", "2211.16056",
             "2003.03488", "2004.03333", "2106.08295", "2101.01321",
             "2004.04136", "2305.15077", "2106.07345", "2104.08821",
             "1607.00325", "2110.06296", "2010.15703", "1711.06077",
             "1903.06733", "2006.04884", "1804.00247", "1706.02677",
             "2004.08249", "1711.00489", "1803.09820", "2012.15701",
             "2205.13016", "1902.08153", "1603.05279", "2206.01861",
             "2209.13325", "2304.09145", "2301.12017", "2306.00317",
             "2305.17888", "1902.08153", "1603.05279", "2206.01861",
             "2209.13325", "1911.12491"]

arxiv_paper_df_with_abstract = make_arxiv_paper_df_with_abstract(paper_ids)

  0%|          | 0/134 [00:00<?, ?it/s]

100%|██████████| 134/134 [07:48<00:00,  3.50s/it]


In [13]:
other_papers = [["Model Compression", "ACM SIGKDD 2006", str_convert_datetime("2006-08-20"),
                "Cristian Bucil˘a et al", "https://dl.acm.org/doi/abs/10.1145/1150402.1150464", 
                "Often the best performing supervised learning models are ensembles of hundreds or thousands of base-level classifiers. Unfortunately, the space required to store this many classifiers, and the time required to execute them at run-time, prohibits their use in applications where test sets are large (e.g. Google), where storage space is at a premium (e.g. PDAs), and where computational power is limited (e.g. hea-ring aids). We present a method for 'compressing' large, complex ensembles into smaller, faster models, usually without significant loss in performance."],
                ["Adaptive Mixtures of Local Experts", "MIT Press 1991", str_convert_datetime("1991-03-01"),
                "Robert A. Jacobs et al", "https://ieeexplore.ieee.org/abstract/document/6797059", 
                "We present a new supervised learning procedure for systems composed of many separate networks, each of which learns to handle a subset of the complete set of training cases. The new procedure can be viewed either as a modular version of a multilayer supervised network, or as an associative version of competitive learning. It therefore provides a new link between these two apparently different approaches. We demonstrate that the learning procedure divides up a vowel discrimination task into appropriate subtasks, each of which can be solved by a very simple expert network."],
                ["Dropout: A Simple Way to Prevent Neural Networks from Overfitting", "JMLR 2014", str_convert_datetime("2014-01-01"),
                "Nitish Srivastava et al", "https://ieeexplore.ieee.org/abstract/document/6797059", 
                "Deep neural nets with a large number of parameters are very powerful machine learning systems. However, overfitting is a serious problem in such networks. Large networks are also slow to use, making it difficult to deal with overfitting by combining the predictions of many different large neural nets at test time. Dropout is a technique for addressing this problem. The key idea is to randomly drop units (along with their connections) from the neural network during training. This prevents units from co-adapting too much. During training, dropout samples from an exponential number of different âthinnedâ networks. At test time, it is easy to approximate the effect of averaging the predictions of all these thinned networks by simply using a single unthinned network that has smaller weights. This significantly reduces overfitting and gives major improvements over other regularization methods. We show that dropout improves the performance of neural networks on supervised learning tasks in vision, speech recognition, document classification and computational biology, obtaining state-of-the-art results on many benchmark data sets."],
                ["Linguistic Regularities in Continuous Space Word Representations", "NAACL 2013", str_convert_datetime("2013-06-01"),
                "Tomas Mikolov et al", "https://aclanthology.org/N13-1090/", 
                "Continuous space language models have recently demonstrated outstanding results across a variety of tasks. In this paper, we examine the vector-space word representations that are implicitly learned by the input-layer weights. We find that these representations are surprisingly good at capturing syntactic and semantic regularities in language, and that each relationship is characterized by a relation-specific vector offset. This allows vector-oriented reasoning based on the offsets between words. For example, the male/female relationship is automatically learned, and with the induced vector representations, “King - Man + Woman” results in a vector very close to “Queen.” We demonstrate that the word vectors capture syntactic regularities by means of syntactic analogy questions (provided with this paper), and are able to correctly answer almost 40% of the questions. We demonstrate that the word vectors capture semantic regularities by using the vector offset method to answer SemEval-2012 Task 2 questions. Remarkably, this method outperforms the best previous systems."],
                 ["Large-Scale Distributed Language Modeling", "IEEE 2007", str_convert_datetime("2007-04-05"),
                "Ahmad Emami et al", "https://ieeexplore.ieee.org/document/4218031", 
                "A novel distributed language model that has no constraints on the n-gram order and no practical constraints on vocabulary size is presented. This model is scalable and allows for an arbitrarily large corpus to be queried for statistical estimates. Our distributed model is capable of producing n-gram counts on demand. By using a novel heuristic estimate for the interpolation weights of a linearly interpolated model, it is possible to dynamically compute the language model probabilities. The distributed architecture follows the client-server paradigm and allows for each client to request an arbitrary weighted mixture of the corpus. This allows easy adaptation of the language model to particular test conditions. Experiments using the distributed LM for re-ranking N-best lists of a speech recognition system resulted in considerable improvements in word error rate (WER), while integration with a machine translation decoder resulted in significant improvements in translation quality as measured by the BLEU score."],
                 ["BLEU: a method for automatic evaluation of machine translation", "ACL 2002", str_convert_datetime("2002-07-01"),
                "Kishore Papineni et al", "https://dl.acm.org/doi/10.3115/1073083.1073135", 
                "Human evaluations of machine translation are extensive but expensive. Human evaluations can take months to finish and involve human labor that can not be reused. We propose a method of automatic machine translation evaluation that is quick, inexpensive, and language-independent, that correlates highly with human evaluation, and that has little marginal cost per run. We present this method as an automated understudy to skilled human judges which substitutes for them when there is need for quick or frequent evaluations."],
                ["Large Language Models in Machine Translation", "EMNLP 2007", str_convert_datetime("2007-06-01"),
                "Gloria Brown Wright et al", "https://aclanthology.org/D07-1090/", 
                "This paper reports on the benefits of largescale statistical language modeling in machine translation. A distributed infrastructure is proposed which we use to train onup to 2 trillion tokens, resulting in languagemodels having up to 300 billion n-grams. Itis capable of providing smoothed probabilities for fast, single-pass decoding. We introduce a new smoothing method, dubbedStupid Backoff, that is inexpensive to trainon large data sets and approaches the qualityof Kneser-Ney Smoothing as the amount oftraining data increases."],
                ["Student-Centered Learning in Higher Education", " ", str_convert_datetime("2011-01-01"),
                "Thorsten Brants et al", "https://files.eric.ed.gov/fulltext/EJ938583.pdf", 
                "In her book, Learner-Centered Teaching, Maryellen Weimer contrasts the practices of teachercentered college teaching and student-centered college teaching in terms of (1) the balance of power in the classroom, (2) the function of the course content, (3) the role of the teacher versus the role of the student, (4) the responsibility of learning, (5) the purpose and processes of evaluation. She then gives some suggestions on how to implement the learner-centered approach. Using Weimer’s five specifications, it has been possible to identify from the pedagogical literature several examples where college teachers are seeking to move toward more student-centered classrooms. This essay reports on innovations used by teachers across the academic and professional spectrum, as well as on their evaluations of their successes."],
                ["Optimization as A Model for Few-shot Learning", "ICLR 2017", str_convert_datetime("2017-07-22"),
                "Sachin Ravi et al", "https://openreview.net/forum?id=rJY0-Kcll", 
                "Though deep neural networks have shown great success in the large data domain, they generally perform poorly on few-shot learning tasks, where a model has to quickly generalize after seeing very few examples from each class. The general belief is that gradient-based optimization in high capacity models requires many iterative steps over many examples to perform well. Here, we propose an LSTM-based meta-learner model to learn the exact optimization algorithm used to train another learner neural network in the few-shot regime. The parametrization of our model allows it to learn appropriate parameter updates specifically for the scenario where a set amount of updates will be made, while also learning a general initialization of the learner network that allows for quick convergence of training. We demonstrate that this meta-learning model is competitive with deep metric-learning techniques for few-shot learning."],
                ["Language Models are Unsupervised Multitask Learners", " ", str_convert_datetime("2019-06-01"),
                "Alec Radford et al", "https://www.semanticscholar.org/paper/Language-Models-are-Unsupervised-Multitask-Learners-Radford-Wu/9405cc0d6169988371b2755e573cc28650d14dfe", 
                "Natural language processing tasks, such as question answering, machine translation, reading comprehension, and summarization, are typically approached with supervised learning on taskspecific datasets. We demonstrate that language models begin to learn these tasks without any explicit supervision when trained on a new dataset of millions of webpages called WebText. When conditioned on a document plus questions, the answers generated by the language model reach 55 F1 on the CoQA dataset matching or exceeding the performance of 3 out of 4 baseline systems without using the 127,000+ training examples. The capacity of the language model is essential to the success of zero-shot task transfer and increasing it improves performance in a log-linear fashion across tasks. Our largest model, GPT-2, is a 1.5B parameter Transformer that achieves state of the art results on 7 out of 8 tested language modeling datasets in a zero-shot setting but still underfits WebText. Samples from the model reflect these improvements and contain coherent paragraphs of text. These findings suggest a promising path towards building language processing systems which learn to perform tasks from their naturally occurring demonstrations."],
                ["BadNets: Evaluating Backdooring Attacks on Deep Neural Networks", "IEEE Access 2019", str_convert_datetime("2019-04-11"),
                "Tianyu Gu et al", "https://ieeexplore.ieee.org/document/8685687", 
                "Deep learning-based techniques have achieved state-of-the-art performance on a wide variety of recognition and classification tasks."],
                ["Neural Cleanse: Identifying and Mitigating Backdoor Attacks in Neural Networks", "IEEE Symposium on Security and Privacy (SP) 2019", str_convert_datetime("2019-01-01"),
                "Bolun Wang et al", "https://www.computer.org/csdl/proceedings-article/sp/2019/666000a707/1dlwir1mwFi", 
                "Lack of transparency in deep neural networks (DNNs) make them susceptible to backdoor attacks, where hidden associations or triggers override normal classification to produce unexpected results."],
                ["SoMoGym: A Toolkit for Developing and Evaluating Controllers and Reinforcement Learning Algorithms for Soft Robots", "IEEE Robotics and Automation Letters 2022", str_convert_datetime("2022-01-01"),
                "Moritz A. Graule et al", "https://ieeexplore.ieee.org/document/9707663", 
                "Soft robots offer a host of benefits over traditional rigid robots, including inherent compliance that lets them passively adapt to variable environments and operate safely around humans and fragile objects."],
                ["Goal Density based Hindsight Experience Prioritization for Multi Goal Robot Manipulation Reinforcement Learning", "IEEE International Workshop on Robot and Human Communication (ROMAN) 2020", str_convert_datetime("2020-09-04"),
                "Yingyi Kuang et al", "https://ieeexplore.ieee.org/document/9223473", 
                "Reinforcement learning for multi-goal robot manipulation tasks is usually challenging, especially when sparse rewards are provided."],
                ["Augmenting Vision-Based Grasp Plans for Soft Robotic Grippers using Reinforcement Learning", "IEEE 18th International Conference on Automation Science and Engineering (CASE) 2022", str_convert_datetime("2022-08-24"),
                "Vighnesh Vatsal et al", "https://ieeexplore.ieee.org/document/9926580", 
                "Vision-based techniques for grasp planning of robotic end-effectors have been successfully deployed in pick-and-place tasks."],
                ["Learning-Based Slip Detection for Robotic Fruit Grasping and Manipulation under Leaf Interference", "AI-Based Sensors and Sensing Systems for Smart Agriculture) 2022", str_convert_datetime("2022-06-01"),
                "Hongyu Zhou et al", "https://www.mdpi.com/1424-8220/22/15/5483", 
                "Robotic harvesting research has seen significant achievements in the past decade, with breakthroughs being made in machine vision, robot manipulation, autonomous navigation and mapping."],
                ["Reward is enough", "Artificial Intelligenc Volume 299", str_convert_datetime("2021-10-01"),
                "David Silver et al", "https://www.sciencedirect.com/science/article/pii/S0004370221000862", 
                "In this article we hypothesise that intelligence, and its associated abilities, can be understood as subserving the maximisation of reward."],
                ["Hierarchical Attention Networks for Document Classification", "ACL 2016", str_convert_datetime("2016-01-01"),
                "Zichao Yang et al", "https://aclanthology.org/N16-1174/", 
                "We propose a hierarchical attention network for document classification."],
                ["ROUGE: A Package for Automatic Evaluation of Summaries", "Artificial Intelligenc Volume 299", str_convert_datetime("2021-10-01"),
                "Chin-Yew Lin et al", "https://aclanthology.org/W04-1013/", 
                "ROUGE stands for Recall-Oriented Understudy for Gisting Evaluation."],
                ["Post-Training with Interrogative Sentences for Enhancing BART-based Korean Question Generator", "ACL 2022", str_convert_datetime("2022-01-01"),
                "Gyu-Min Park et al", "https://aclanthology.org/2022.aacl-short.26/", 
                "The pre-trained language models such as KoBART often fail in generating perfect interrogative sentences when they are applied to Korean question generation."],
                ["Dialog-Post Multi-Level Self-Supervised Objectives and Hierarchical Model for Dialogue Post-Training", "ACL 2023", str_convert_datetime("2023-01-01"),
                "Zhenyu Zhang et al", "https://aclanthology.org/2023.acl-long.564/", 
                "Dialogue representation and understanding aim to convert conversational inputs into embeddings and fulfill discriminative tasks."],
                ["Improving Transformer Optimization Through Better Initialization", "ICML 2020", str_convert_datetime("2020-01-01"),
                "Xiao Shi Huang et al", "https://proceedings.mlr.press/v119/huang20f.html", 
                "We propose a hierarchical attention network for document classification."]
                ]

arxiv_paper_df_with_abstract = add_other_papers_column(arxiv_paper_df_with_abstract, other_papers)

100%|██████████| 22/22 [00:00<00:00, 785.80it/s]


In [14]:
arxiv_paper_df_with_abstract["Link"] = arxiv_paper_df_with_abstract["Link"].apply(hyperlink)

In [17]:
arxiv_paper_df_with_abstract = input_jouranl_conference_theme(arxiv_paper_df_with_abstract)

In [10]:
theme_order = ["Neural Network", "Benchmark", "Word Embedding", "Explainable Artificial Intelligence (XAI)",
            "Language Model", "Pre-Trained Language Model", "Multimodal Learning", "Image Classification",
            "Machine Translation", "Natural Language Understanding (NLU)", "Text Generation",
            "Meta Learning", "Continual Learning", "Mixture of Experts", "Ensemble",
            "Model Compression", "Knoweldge Distillation", "Quantization", "Pruning",
            "Low-Rank Factorization", "Early Exit", "Reinforcement Learning", "Security", "Computer Vision"]

arxiv_paper_df_with_abstract_by_theme = make_arxiv_paper_df_with_abstract_by_theme(theme_order, arxiv_paper_df_with_abstract)

In [13]:
arxiv_paper_df = make_arxiv_paper_df(arxiv_paper_df_with_abstract)
arxiv_paper_df_by_theme = make_arxiv_paper_df_by_theme(arxiv_paper_df_with_abstract_by_theme)

In [8]:
arxiv_paper_df_with_abstract

Unnamed: 0.1,Unnamed: 0,Title,Journal/Conference,Date,Author,Theme,Link,Abstract
0,1,Adaptive Mixtures of Local Experts,MIT Press 1991,1991-03-01,Robert A. Jacobs et al,Mixture of Experts,[Link](https://ieeexplore.ieee.org/abstract/do...,We present a new supervised learning procedure...
1,2,BLEU: a method for automatic evaluation of mac...,ACL 2002,2002-07-01,Kishore Papineni et al,Benchmark,[Link](https://dl.acm.org/doi/10.3115/1073083....,Human evaluations of machine translation are e...
2,3,Model Compression,ACM SIGKDD 2006,2006-08-20,Cristian Bucil˘a et al,Model Compression,[Link](https://dl.acm.org/doi/abs/10.1145/1150...,Often the best performing supervised learning ...
3,4,Large-Scale Distributed Language Modeling,IEEE 2007,2007-04-05,Ahmad Emami et al,Language Model,[Link](https://ieeexplore.ieee.org/document/42...,A novel distributed language model that has no...
4,5,Large Language Models in Machine Translation,Teaching and Learning in Higher Education,2007-06-01,Gloria Brown Wright et al,Machine Translation,[Link](https://aclanthology.org/D07-1090/),This paper reports on the benefits of largesca...
...,...,...,...,...,...,...,...,...
132,133,QLoRA: Efficient Finetuning of Quantized LLMs,EMNLP 2023,2023-05-23,Tim Dettmers et al,Quantization,[Link](http://arxiv.org/abs/2305.14314v1),"We present QLoRA, an efficient finetuning appr..."
133,134,Contrastive Learning of Sentence Embeddings fr...,,2023-05-24,Junlei Zhang et al,Word Embedding,[Link](http://arxiv.org/abs/2305.15077v2),Contrastive learning has been the dominant app...
134,135,An Empirical Comparison of LM-based Question a...,ACL 2023,2023-05-26,Asahi Ushio et al,Language Model,[Link](http://arxiv.org/abs/2305.17002v1),Question and answer generation (QAG) consists ...
135,136,A Practical Toolkit for Multilingual Question ...,,2023-05-27,Asahi Ushio et al,Language Model,[Link](http://arxiv.org/abs/2305.17416v1),Generating questions along with associated ans...


In [14]:
arxiv_paper_df_with_abstract_by_theme

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 0,Title,Journal/Conference,Date,Author,Link,Abstract
Theme,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
Neural Network,1,11,Dropout: A Simple Way to Prevent Neural Networ...,JMLR 2014,2014-01-01,Nitish Srivastava et al,[Link](https://ieeexplore.ieee.org/abstract/do...,Deep neural nets with a large number of parame...
Neural Network,2,12,Convolutional Neural Networks for Sentence Cla...,EMNLP 2014,2014-08-25,Yoon Kim et al,[Link](http://arxiv.org/abs/1408.5882v2),We report on a series of experiments with conv...
Neural Network,3,20,Convolutional Neural Networks using Logarithmi...,,2016-03-03,Daisuke Miyashita et al,[Link](http://arxiv.org/abs/1603.01025v2),Recent advances in convolutional neural networ...
Neural Network,4,26,Permutation Invariant Training of Deep Models ...,,2016-07-01,Dong Yu et al,[Link](http://arxiv.org/abs/1607.00325v2),"We propose a novel deep learning model, which ..."
Neural Network,5,33,"Accurate, Large Minibatch SGD: Training ImageN...",NeurIPS 2017,2017-06-08,Priya Goyal et al,[Link](http://arxiv.org/abs/1706.02677v2),Deep learning thrives with large neural networ...
...,...,...,...,...,...,...,...,...
Computer Vision,133,41,The Perception-Distortion Tradeoff,CVPR 2018,2017-11-16,Yochai Blau et al,[Link](http://arxiv.org/abs/1711.06077v4),Image restoration algorithms are typically eva...
Computer Vision,134,50,Do CIFAR-10 Classifiers Generalize to CIFAR-10?,,2018-06-01,Benjamin Recht et al,[Link](http://arxiv.org/abs/1806.00451v1),Machine learning is currently dominated by lar...
Computer Vision,135,54,Making Sense of Vision and Touch: Self-Supervi...,ICRA 2019,2018-10-24,Michelle A. Lee et al,[Link](http://arxiv.org/abs/1810.10191v2),Contact-rich manipulation tasks in unstructure...
Computer Vision,136,92,An Image is Worth 16x16 Words: Transformers fo...,CVPR 2021,2020-10-22,Alexey Dosovitskiy et al,[Link](http://arxiv.org/abs/2010.11929v2),While the Transformer architecture has become ...


In [15]:
arxiv_paper_df_with_abstract.to_excel("arxiv_paper_df_with_abstract.xlsx")
arxiv_paper_df.to_excel("arxiv_paper_df.xlsx")
# arxiv_paper_df_with_abstract = pd.read_excel("arxiv_paper_df_with_abstract.xlsx", engine='openpyxl')

arxiv_paper_df_with_abstract_by_theme.to_excel("arxiv_paper_df_with_abstract_by_theme.xlsx")
arxiv_paper_df_by_theme.to_excel("arxiv_paper_df_by_theme.xlsx")
# arxiv_paper_df_with_abstract_by_theme = pd.read_excel("arxiv_paper_df_with_abstract_by_theme.xlsx", engine='openpyxl')

### Upload Dataframe on Github

[Excel to Markdown Converter](https://tabletomarkdown.com/convert-spreadsheet-to-markdown/)