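# Samples

Qualitative nearest-neighbour samples: for each seed paper, the top-ranked neighbours from the general-purpose (SPECTER) vectors are shown side by side with those from the task-, method- and dataset-specific vectors.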

In [1]:
# --- Dataset ---------------------------------------------------------------
hf_dataset = 'paperswithcode_aspects'
nlp_cache_dir = './data/nlp_cache'

# --- Output locations (all below one common output directory) ---------------
_output_dir = './output/pwc'
index_dir = f'{_output_dir}/whoosh_index'
tensorboard_dir = f'{_output_dir}/tensorboard'

# --- Document vector files (loaded with load_word2vec_format below) ---------
# SPECTER
general_fp = f'{_output_dir}/specter.w2v.txt'

# Fine-tuned Sentence-SciBERT: one vector file per aspect, same layout for each.
# (Alternative file name noted by the author: pwc_id2vec__train_and_test.w2v.txt)
_aspect_fp_template = _output_dir + '/{aspect}/1/st_scibert-scivocab-uncased/pwc_id2vec__all_docs.w2v.txt'
task_fp = _aspect_fp_template.format(aspect='task')
method_fp = _aspect_fp_template.format(aspect='method')
dataset_fp = _aspect_fp_template.format(aspect='dataset')


In [2]:
# Hand-picked seed papers: paper ID -> title (titles as noted by the author).
_sample_titles_by_id = {
    'V9yaFJy03j': 'Data augmentation for low resource sentiment analysis using generative adversarial networks',
    '9rB_3A5Wy0': 'Sentiment Analysis of German Twitter',
    'N0jcCtrbqO': 'Fake News in Social Networks',
}
# Only the IDs are used downstream; dict order is insertion order.
sample_ids = list(_sample_titles_by_id)

In [3]:
from gensim.models import KeyedVectors
import os
import random
import sys
import numpy as np
import pandas as pd
from collections import defaultdict
from datasets import load_dataset
from experiments.utils import get_local_hf_dataset_path
from fuzzywuzzy import fuzz, process
from tqdm.auto import tqdm
from paperswithcode import Paper
from IPython.core.display import display, HTML



In [4]:
# Load the four embedding spaces in a fixed order: general, task, method, dataset.
general_vecs, task_vecs, method_vecs, dataset_vecs = [
    KeyedVectors.load_word2vec_format(vec_fp)
    for vec_fp in (general_fp, task_fp, method_fp, dataset_fp)
]

# Normalize vectors (replace=True asks gensim to keep only the normalized ones)
for _vecs in (general_vecs, task_vecs, method_vecs, dataset_vecs):
    _vecs.init_sims(replace=True)

In [5]:
# Load the paper metadata: the 'docs' config / 'docs' split of the local dataset
docs_ds = load_dataset(
    get_local_hf_dataset_path(hf_dataset),
    name='docs',
    split='docs',
    cache_dir=nlp_cache_dir,
)

Reusing dataset pwc_aspects (./data/nlp_cache/pwc_aspects/docs/0.1.0/5a02274a50cfdd54f404ef512e5453e7f1a9db1cef85c4ae2ecd4607bc43943e)


In [6]:
# Index every metadata record by its paper ID, wrapped in a Paper object.
paper_id2paper = dict(
    (doc['paper_id'], Paper(**doc))
    for doc in docs_ds
)

In [7]:
# Find neighbors
top_k = 5  # neighbours requested from (and rows rendered for) each embedding space
max_abstract_length = 200  # abstract characters shown before the "..." toggle link

def get_html(rank, paper, score=0., show_details=True):
    """Render a single paper as an HTML snippet.

    Args:
        rank: Label printed before the title (a rank number, or a string such
            as 'Seed').
        paper: Object exposing ``title``, ``paper_url`` and, when details are
            shown, ``paper_id``, ``abstract``, ``aspect_tasks``,
            ``aspect_methods`` and ``aspect_datasets``.
        score: Similarity score, printed with three decimals next to the title.
        show_details: If true, append the aspect lists and the abstract. The
            first ``max_abstract_length`` characters are visible; the rest is
            placed in a hidden span toggled by the "..." link.

    Returns:
        str: A ``<div>`` with a linked ``<h3>`` heading and, optionally, the
        details paragraphs.
    """
    # Stdlib helper; imported locally so the function does not rely on the
    # notebook's import cell being extended.
    from html import escape

    details_html = ''
    if show_details:
        # Everything below comes from dataset records, so it is escaped before
        # being embedded in markup. Missing values render as empty text.
        abstract = paper.abstract or ''
        teaser = escape(abstract[:max_abstract_length])
        remainder = escape(abstract[max_abstract_length:])
        tasks = escape(', '.join(paper.aspect_tasks or ()))
        methods = escape(', '.join(paper.aspect_methods or ()))
        datasets = escape(', '.join(paper.aspect_datasets or ()))
        abstract_id = escape(str(paper.paper_id))

        # The second paragraph is closed with </p>; it used to be closed with a
        # stray </div>, which unbalanced the surrounding markup.
        details_html = f'''
        <p style="margin: 0; padding: 0; font-size: 1.1rem">
        <b>Tasks:</b> {tasks}
        <b>Methods:</b> {methods}
        <b>Datasets:</b> {datasets}
        </p><p>
        {teaser} <a href="#" onclick="$('#abstract_{abstract_id}').toggle();">...</a>
        <span id="abstract_{abstract_id}" style="display:none">{remainder}</span>
        </p>
        '''

    rank_label = escape(str(rank))
    url = escape(str(paper.paper_url))
    title = escape(str(paper.title))

    return f'''
        <div>
        <h3>{rank_label}. <a href="{url}">{title}</a> <small style="background: #eee">{score:.3f}</small></h3>
        {details_html}
        </div>
        '''
    

def get_col(nn, rank, show_details=True):
    """Render the table cell for the neighbour at a given 1-based rank.

    Args:
        nn: Sequence of ``(paper_id, score)`` pairs, best match first.
        rank: 1-based position in ``nn`` of the neighbour to render.
        show_details: Forwarded to ``get_html``.

    Returns:
        str: A top-aligned ``<td>`` wrapping the paper's HTML snippet.
    """
    # Ranks are 1-based for display; the neighbour list is 0-based.
    neighbor_id, similarity = nn[rank - 1]
    neighbor = paper_id2paper[neighbor_id]
    cell_body = get_html(rank, neighbor, similarity, show_details)
    return '<td style="vertical-align: top">' + cell_body + '</td>'

def get_multi_view_html(seed_id, show_details=True):
    """Build a side-by-side HTML comparison of a seed paper's neighbours.

    The seed paper is rendered first (always with details), followed by a
    table with one column per embedding space and one row per rank
    (1..``top_k``).

    Args:
        seed_id: Paper ID to query; looked up in ``paper_id2paper`` and in
            each of the four vector sets.
        show_details: Forwarded to ``get_col`` for the neighbour cells.

    Returns:
        str: The HTML for the seed paper, a horizontal rule and the table.
    """
    # (column title, vectors) in display order.
    views = (
        ('General purpose', general_vecs),
        ('Task-related', task_vecs),
        ('Method-related', method_vecs),
        ('Dataset-related', dataset_vecs),
    )
    col_width = '25%'

    neighbors_per_view = [
        list(vecs.most_similar(seed_id, topn=top_k)) for _, vecs in views
    ]

    parts = [get_html('Seed', paper_id2paper[seed_id]), ' <hr />']

    # Header row; the <tr> is closed here (it used to be left open).
    header_cells = ''.join(
        f'<th width="{col_width}">{title}</th>' for title, _ in views
    )
    parts.append(f'<table><thead><tr>{header_cells}</tr></thead><tbody>')

    for rank in range(1, top_k + 1):
        parts.append('<tr style="vertical-align: top">')
        for nn in neighbors_per_view:
            if rank <= len(nn):
                parts.append(get_col(nn, rank, show_details))
            else:
                # Fewer than top_k neighbours came back for this space: keep
                # the column aligned with an empty cell instead of raising.
                parts.append('<td></td>')
        parts.append('</tr>')

    parts.append('</tbody></table>')

    return ''.join(parts)


## Select samples

In [8]:
# Render the multi-view comparison for each hand-picked seed paper.
for pid in sample_ids:
    multi_view_html = get_multi_view_html(pid, show_details=True)
    display(HTML(multi_view_html))

General purpose,Task-related,Method-related,Dataset-related
"1. Adversarial Training for Aspect-Based Sentiment Analysis with BERT 0.846  Tasks: Aspect-Based Sentiment Analysis, Aspect Extraction, Language Modelling, Sentiment Analysis  Methods: Residual Connection, Attention Dropout, Linear Warmup With Linear Decay, Weight Decay, GELU, Dense Connections, Adam, WordPiece, Softmax, Dropout, Multi-Head Attention, Layer Normalization, Scaled Dot-Product Attention, BERT  Datasets: SemEval 2014 Task 4 Sub Task 2  Aspect-Based Sentiment Analysis (ABSA) deals with the extraction of sentiments and their targets. Collecting labeled data for this task in order to help neural networks generalize better can be labori ...","1. Not Enough Data? Deep Learning to the Rescue! 0.987  Tasks: Data Augmentation, Language Modelling, Text Classification, Text Generation  Methods: Datasets: Based on recent advances in natural language modeling and those in text generation capabilities, we propose a novel data augmentation method for text classification tasks. We use a powerful pre-traine ...","1. DNA Methylation Data to Predict Suicidal and Non-Suicidal Deaths: A Machine Learning Approach 0.980  Tasks: Data Visualization, Dimensionality Reduction  Methods: PCA  Datasets: The objective of this study is to predict suicidal and non-suicidal deaths from DNA methylation data using a modern machine learning algorithm. We used support vector machines to classify existing sec ...","1. Semi-supervised and Transfer learning approaches for low resource sentiment classification 0.989  Tasks: Sentiment Analysis, Transfer Learning  Methods: Datasets: Sentiment classification involves quantifying the affective reaction of a human to a document, media item or an event. Although researchers have investigated several methods to reliably infer sentimen ..."
"2. Data Augmentation in Emotion Classification Using Generative Adversarial Networks 0.821  Tasks: Data Augmentation, Emotion Classification  Methods: Datasets: It is a difficult task to classify images with multiple class labels using only a small number of labeled examples, especially when the label (class) distribution is imbalanced. Emotion classification ...","2. Text Data Augmentation: Towards better detection of spear-phishing emails 0.986  Tasks: Data Augmentation, Language Modelling, Machine Translation, Question Answering, Text Augmentation, Text Classification  Methods: Multi-Head Attention, Residual Connection, Scaled Dot-Product Attention, Attention Dropout, Weight Decay, Adam, Softmax, WordPiece, Dense Connections, Layer Normalization, GELU, Linear Warmup With Linear Decay, Dropout, BERT  Datasets: Text data augmentation, i.e. the creation of synthetic textual data from an original text, is challenging as augmentation transformations should take into account language complexity while being relev ...","2. Company classification using machine learning 0.979  Tasks: Decision Making, Dimensionality Reduction, Portfolio Optimization  Methods: Datasets: The recent advancements in computational power and machine learning algorithms have led to vast improvements in manifold areas of research. Especially in finance, the application of machine learning e ...","2. Affection Driven Neural Networks for Sentiment Analysis 0.988  Tasks: Sentiment Analysis  Methods: Sigmoid Activation, Tanh Activation, LSTM  Datasets: Deep neural network models have played a critical role in sentiment analysis with promising results in the recent decade. One of the essential challenges, however, is how external sentiment knowledge ..."
"3. Hierarchical Attention Generative Adversarial Networks for Cross-domain Sentiment Classification 0.817  Tasks: Domain Adaptation, Sentiment Analysis  Methods: Datasets: Cross-domain sentiment classification (CDSC) is an importance task in domain adaptation and sentiment classification. Due to the domain discrepancy, a sentiment classifier trained on source domain dat ...","3. Conditional BERT Contextual Augmentation 0.986  Tasks: Data Augmentation, Language Modelling, Text Classification  Methods: Residual Connection, Attention Dropout, Linear Warmup With Linear Decay, Weight Decay, GELU, Dense Connections, Adam, WordPiece, Softmax, Dropout, Multi-Head Attention, Layer Normalization, Scaled Dot-Product Attention, BERT  Datasets: We propose a novel data augmentation method for labeled sentences called conditional BERT contextual augmentation. Data augmentation methods are often applied to prevent overfitting and improve genera ...",3. Inductive Hashing on Manifolds 0.977  Tasks: Methods: Datasets: Learning based hashing methods have attracted considerable attention due to their ability to greatly increase the scale at which existing algorithms may operate. Most of these methods are designed to ...,"3. Learning representations for sentiment classification using Multi-task framework 0.987  Tasks: Multi-Task Learning, Sentiment Analysis  Methods: Datasets: Most of the existing state of the art sentiment classification techniques involve the use of pre-trained embeddings. This paper postulates a generalized representation that collates training on multip ..."
"4. Semi-supervised and Transfer learning approaches for low resource sentiment classification 0.816  Tasks: Sentiment Analysis, Transfer Learning  Methods: Datasets: Sentiment classification involves quantifying the affective reaction of a human to a document, media item or an event. Although researchers have investigated several methods to reliably infer sentimen ...","4. Improving short text classification through global augmentation methods 0.986  Tasks: Text Augmentation, Text Classification  Methods: Datasets: We study the effect of different approaches to text augmentation. To do this we use 3 datasets that include social media and formal text in the form of news articles. Our goal is to provide insights f ...",4. t-SNE-CUDA: GPU-Accelerated t-SNE and its Applications to Modern Data 0.976  Tasks: Dimensionality Reduction  Methods: Datasets: Modern datasets and models are notoriously difficult to explore and analyze due to their inherent high dimensionality and massive numbers of samples. Existing visualization methods which employ dimens ...,"4. Learning with Noisy Labels for Sentence-level Sentiment Classification 0.986  Tasks: Learning with noisy labels, Sentiment Analysis  Methods: Datasets: Deep neural networks (DNNs) can fit (or even over-fit) the training data very well. If a DNN model is trained using data with noisy labels and tested on data with clean labels, the model may perform p ..."
"5. On Enhancing Speech Emotion Recognition using Generative Adversarial Networks 0.815  Tasks: Emotion Recognition, Speech Emotion Recognition  Methods: Convolution, GAN  Datasets: Generative Adversarial Networks (GANs) have gained a lot of attention from machine learning community due to their ability to learn and mimic an input data distribution. GANs consist of a discriminato ...","5. Contextual Augmentation: Data Augmentation by Words with Paradigmatic Relations 0.985  Tasks: Data Augmentation, Language Modelling, Text Augmentation, Text Classification  Methods: Datasets: We propose a novel data augmentation for labeled sentences called contextual augmentation. We assume an invariance that sentences are natural even if the words in the sentences are replaced with other ...","5. Hashing on Nonlinear Manifolds 0.975  Tasks: Image Classification, Quantization, Semantic Retrieval  Methods: Datasets: Learning based hashing methods have attracted considerable attention due to their ability to greatly increase the scale at which existing algorithms may operate. Most of these methods are designed to ...","5. Complementary Fusion of Multi-Features and Multi-Modalities in Sentiment Analysis 0.986  Tasks: Emotion Recognition, Multimodal Emotion Recognition, Multimodal Sentiment Analysis, Sentiment Analysis  Methods: Datasets: Sentiment analysis, mostly based on text, has been rapidly developing in the last decade and has attracted widespread attention in both academia and industry. However, the information in the real worl ..."


General purpose,Task-related,Method-related,Dataset-related
"1. Comparing methods for Twitter Sentiment Analysis 0.873  Tasks: Sentiment Analysis, Twitter Sentiment Analysis  Methods: SVM, Logistic Regression  Datasets: This work extends the set of works which deal with the popular problem of sentiment analysis in Twitter. It investigates the most popular document (""tweet"") representation methods which feed sentiment ...","1. Opinion Mining on Non-English Short Text 0.993  Tasks: Opinion Mining, Sentiment Analysis  Methods: Datasets: As the type and the number of such venues increase, automated analysis of sentiment on textual resources has become an essential data mining task. In this paper, we investigate the problem of mining o ...","1. VICTOR: a Dataset for Brazilian Legal Documents Classification 0.986  Tasks: Methods: Datasets: BVICTOR, MVICTOR (theme), SVICTOR (theme), MVICTOR (type), SVICTOR (type)  This paper describes VICTOR, a novel dataset built from Brazil{'}s Supreme Court digitalized legal documents, composed of more than 45 thousand appeals, which includes roughly 692 thousand documents{- ...","1. A Simple Approach to Multilingual Polarity Classification in Twitter 0.988  Tasks: Sentiment Analysis  Methods: Datasets: Recently, sentiment analysis has received a lot of attention due to the interest in mining opinions of social media users. Sentiment analysis consists in determining the polarity of a given text, i.e. ..."
"2. A Simple Approach to Multilingual Polarity Classification in Twitter 0.863  Tasks: Sentiment Analysis  Methods: Datasets: Recently, sentiment analysis has received a lot of attention due to the interest in mining opinions of social media users. Sentiment analysis consists in determining the polarity of a given text, i.e. ...","2. A Scalable, Lexicon Based Technique for Sentiment Analysis 0.992  Tasks: Opinion Mining, Sentiment Analysis  Methods: Datasets: Rapid increase in the volume of sentiment rich social media on the web has resulted in an increased interest among researchers regarding Sentimental Analysis and opinion mining. However, with so much ...",2. Semi-supervised Named Entity Recognition in noisy-text 0.984  Tasks: Named Entity Recognition  Methods: Dropout  Datasets: Many of the existing Named Entity Recognition (NER) solutions are built based on news corpus data with proper syntax. These solutions might not lead to highly accurate results when being applied to no ...,"2. Using Hadoop for Large Scale Analysis on Twitter: A Technical Report 0.988  Tasks: Decision Making, Opinion Mining, Sentiment Analysis  Methods: Datasets: Sentiment analysis (or opinion mining) on Twitter data has attracted much attention recently. One of the system's key features, is the immediacy in communication with other users in an easy, user-frie ..."
"3. Generating Sentiment Lexicons for German Twitter 0.846  Tasks: Methods: Datasets: Despite a substantial progress made in developing new sentiment lexicon generation (SLG) methods for English, the task of transferring these approaches to other languages and domains in a sound way st ...","3. Adapting Freely Available Resources to Build an Opinion Mining Pipeline in Portuguese 0.991  Tasks: Named Entity Recognition, Opinion Mining, Part-Of-Speech Tagging, Sentiment Analysis  Methods: Datasets: We present a complete UIMA-based pipeline for sentiment analysis in Portuguese news using freely available resources and a minimal set of manually annotated training data. We obtained good precision o ...","3. Corpus Creation and Analysis for Named Entity Recognition in Telugu-English Code-Mixed Social Media Data 0.982  Tasks: Entity Extraction using GAN, Named Entity Recognition  Methods: Datasets: Named Entity Recognition(NER) is one of the important tasks in Natural Language Processing(NLP) and also is a subtask of Information Extraction. In this paper we present our work on NER in Telugu-Engl ...","3. An Arabic Tweets Sentiment Analysis Dataset (ATSAD) using Distant Supervision and Self Training 0.988  Tasks: Arabic Sentiment Analysis, Sentiment Analysis  Methods: Datasets: As the number of social media users increases, they express their thoughts, needs, socialise and publish their opinions reviews. For good social media sentiment analysis, good quality resources are ne ..."
"4. Approaches for Sentiment Analysis on Twitter: A State-of-Art study 0.844  Tasks: Opinion Mining, Sentiment Analysis  Methods: Datasets: Microbloging is an extremely prevalent broadcast medium amidst the Internet fraternity these days. People share their opinions and sentiments about variety of subjects like products, news, institution ...","4. Sentiment Analysis for Low Resource Languages: A Study on Informal Indonesian Tweets 0.991  Tasks: Sentiment Analysis  Methods: Datasets: This paper describes our attempt to build a sentiment analysis system for Indonesian tweets. With this system, we can study and identify sentiments and opinions in a text or document computationally. ...","4. An Empirical Study of Discriminative Sequence Labeling Models for Vietnamese Text Processing 0.981  Tasks: Feature Engineering, Named Entity Recognition, Part-Of-Speech Tagging, Word Embeddings  Methods: Datasets: This paper presents an empirical study of two widely-used sequence prediction models, Conditional Random Fields (CRFs) and Long Short-Term Memory Networks (LSTMs), on two fundamental tasks for Vietnam ...","4. Sentiment Analysis for Hinglish Code-mixed Tweets by means of Cross-lingual Word Embeddings 0.987  Tasks: Sentiment Analysis, Transfer Learning, Word Embeddings  Methods: Datasets: This paper investigates the use of unsupervised cross-lingual embeddings for solving the problem of code-mixed social media text understanding. We specifically investigate the use of these embeddings ..."
"5. Sentiment Analysis For Modern Standard Arabic And Colloquial 0.843  Tasks: Arabic Sentiment Analysis, Sentiment Analysis  Methods: SVM  Datasets: The rise of social media such as blogs and social networks has fueled interest in sentiment analysis. With the proliferation of reviews, ratings, recommendations and other forms of online expression, ...","5. Sentiment Analysis Using Collaborated Opinion Mining 0.991  Tasks: Opinion Mining, Sentiment Analysis  Methods: Datasets: Opinion mining and Sentiment analysis have emerged as a field of study since the widespread of World Wide Web and internet. Opinion refers to extraction of those lines or phrase in the raw and huge da ...","5. Discourse-Aware Rumour Stance Classification in Social Media Using Sequential Classifiers 0.981  Tasks: Stance Classification  Methods: Sigmoid Activation, Tanh Activation, LSTM  Datasets: Rumour stance classification, defined as classifying the stance of specific social media posts into one of supporting, denying, querying or commenting on an earlier post, is becoming of increasing int ...","5. Comparing and Combining Sentiment Analysis Methods 0.987  Tasks: Sentiment Analysis  Methods: Datasets: Several messages express opinions about events, products, and services, political views or even their author's emotional state and mood. Sentiment analysis has been used in several applications includ ..."


General purpose,Task-related,Method-related,Dataset-related
"1. Lean From Thy Neighbor: Stochastic & Adversarial Bandits in a Network 0.791  Tasks: Decision Making  Methods: Datasets: An individual's decisions are often guided by those of his or her peers, i.e., neighbors in a social network. Presumably, being privy to the experiences of others aids in learning and decision making, ...","1. Defending Against Neural Fake News 0.998  Tasks: Fake News Detection, Text Generation  Methods: Datasets: Grover-Mega  Recent progress in natural language generation has raised dual-use concerns. While applications like summarization and translation are positive, the underlying technology also might enable adversaries ...","1. Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics 0.986  Tasks: Transfer Learning  Methods: Datasets: Learning robot tasks or controllers using deep reinforcement learning has been proven effective in simulations. Learning in simulation has several advantages. For example, one can fully control the si ...","1. Credulous Users and Fake News: a Real Case Study on the Propagation in Twitter 0.981  Tasks: Fake News Detection  Methods: Datasets: Recent studies have confirmed a growing trend, especially among youngsters, of using Online Social Media as favourite information platform at the expense of traditional mass media. Indeed, they can ea ..."
"2. Incentivizing Exploration with Selective Data Disclosure 0.789  Tasks: Methods: Datasets: We study the design of rating systems that incentivize (more) efficient social learning among self-interested agents. Agents arrive sequentially and are presented with a set of possible actions, each ...","2. DeHiDe: Deep Learning-based Hybrid Model to Detect Fake News using Blockchain 0.997  Tasks: Methods: Datasets: The surge in the spread of misleading information, lies, propaganda, and false facts, frequently known as fake news, raised questions concerning social media's influence in today's fast-moving democra ...","2. Robust Recovery Controller for a Quadrupedal Robot using Deep Reinforcement Learning 0.986  Tasks: Methods: Datasets: The ability to recover from a fall is an essential feature for a legged robot to navigate in challenging environments robustly. Until today, there has been very little progress on this topic. Current ...","2. Where Are the Facts? Searching for Fact-checked Information to Alleviate the Spread of Fake News 0.980  Tasks: Ad-Hoc Information Retrieval, Fact Verification, Fake News Detection, Image Matting, misinformation, Text Matching  Methods: Datasets: Although many fact-checking systems have been developed in academia and industry, fake news is still proliferating on social media. These systems mostly focus on fact-checking but usually neglect onli ..."
"3. Online discrete optimization in social networks in the presence of Knightian uncertainty 0.786  Tasks: Decision Making  Methods: Datasets: We study a model of collective real-time decision-making (or learning) in a social network operating in an uncertain environment, for which no a priori probabilistic model is available. Instead, the e ...",3. News Labeling as Early as Possible: Real or Fake? 0.997  Tasks: Methods: Datasets: Making disguise between real and fake news propagation through online social networks is an important issue in many applications. The time gap between the news release time and detection of its label ...,"3. Acceleration of Actor-Critic Deep Reinforcement Learning for Visual Grasping in Clutter by State Representation Learning Based on Disentanglement of a Raw Input Image 0.986  Tasks: Representation Learning, Robotic Grasping  Methods: Datasets: For a robotic grasping task in which diverse unseen target objects exist in a cluttered environment, some deep learning-based methods have achieved state-of-the-art results using visual input directly ...","3. Balancing information exposure in social networks 0.979  Tasks: Methods: Datasets: Social media has brought a revolution on how people are consuming news. Beyond the undoubtedly large number of advantages brought by social-media platforms, a point of criticism has been the creation ..."
4. Beliefs in Decision-Making Cascades 0.785  Tasks: Decision Making  Methods: Datasets: This work explores a social learning problem with agents having nonidentical noise variances and mismatched beliefs. We consider an $N$-agent binary hypothesis test in which each agent sequentially ma ...,"4. Credulous Users and Fake News: a Real Case Study on the Propagation in Twitter 0.997  Tasks: Fake News Detection  Methods: Datasets: Recent studies have confirmed a growing trend, especially among youngsters, of using Online Social Media as favourite information platform at the expense of traditional mass media. Indeed, they can ea ...","4. FORECASTER: A Continual Lifelong Learning Approach to Improve Hardware Efficiency 0.986  Tasks: Methods: Datasets: Computer applications are continuously evolving. However, significant knowledge can be harvested from older applications or versions and applied in the context of newer applications or versions. Such ...","4. Leveraging the Crowd to Detect and Reduce the Spread of Fake News and Misinformation 0.978  Tasks: misinformation, Point Processes  Methods: Datasets: Online social networking sites are experimenting with the following crowd-powered procedure to reduce the spread of fake news and misinformation: whenever a user is exposed to a story through her feed ..."
"5. Learning without Recall by Random Walks on Directed Graphs 0.783  Tasks: Bayesian Inference  Methods: Datasets: We consider a network of agents that aim to learn some unknown state of the world using private observations and exchange of beliefs. At each time, agents observe private signals generated based on th ...","5. Attributed Multi-Relational Attention Network for Fact-checking URL Recommendation 0.997  Tasks: Recommendation Systems  Methods: Datasets: To combat fake news, researchers mostly focused on detecting fake news and journalists built and maintained fact-checking sites (e.g., Snopes.com and Politifact.com). However, fake news dissemination ...","5. Continuous State-Space Models for Optimal Sepsis Treatment - a Deep Reinforcement Learning Approach 0.985  Tasks: Decision Making  Methods: Datasets: Sepsis is a leading cause of mortality in intensive care units (ICUs) and costs hospitals billions annually. Treating a septic patient is highly challenging, because individual patients respond very d ...",5. Online Learning and Optimization Under a New Linear-Threshold Model with Negative Influence 0.976  Tasks: Methods: Datasets: We propose a new class of Linear Threshold Model-based information-diffusion model that incorporates the formation and spread of negative attitude. We call such models negativity-aware.. We show that ...


## Random samples

In [10]:
# Draw the random seed papers from a dedicated, seeded generator so that the
# same papers are shown on every Restart & Run All; the global `random` state
# is left untouched.
random_seed = 42
random_ids = random.Random(random_seed).sample(list(paper_id2paper), 3)

for pid in random_ids:
    display(HTML(get_multi_view_html(pid, show_details=True)))

General purpose,Task-related,Method-related,Dataset-related
"1. Bank distress in the news: Describing events through deep learning 0.792  Tasks: Methods: Datasets: While many models are purposed for detecting the occurrence of significant events in financial systems, the task of providing qualitative detail on the developments is not usually as well automated. W ...","1. Bank distress in the news: Describing events through deep learning 0.982  Tasks: Methods: Datasets: While many models are purposed for detecting the occurrence of significant events in financial systems, the task of providing qualitative detail on the developments is not usually as well automated. W ...","1. Jointly Learning to Detect Emotions and Predict Facebook Reactions 0.978  Tasks: Emotion Classification  Methods: Datasets: The growing ubiquity of Social Media data offers an attractive perspective for improving the quality of machine learning-based models in several fields, ranging from Computer Vision to Natural Languag ...",1. Deep learning bank distress from news and numerical financial data 0.979  Tasks: Methods: Datasets: In this paper we focus our attention on the exploitation of the information contained in financial news to enhance the performance of a classifier of bank distress. Such information should be analyzed ...
2. Deep learning bank distress from news and numerical financial data 0.790  Tasks: Methods: Datasets: In this paper we focus our attention on the exploitation of the information contained in financial news to enhance the performance of a classifier of bank distress. Such information should be analyzed ...,"2. Firms Default Prediction with Machine Learning 0.979  Tasks: Methods: Datasets: Academics and practitioners have studied over the years models for predicting firms bankruptcy, using statistical and machine-learning approaches. An earlier sign that a company has financial difficul ...","2. Multimodal Sentiment Analysis To Explore the Structure of Emotions 0.978  Tasks: Multimodal Sentiment Analysis, Sentiment Analysis  Methods: Datasets: We propose a novel approach to multimodal sentiment analysis using deep neural networks combining visual analysis and natural language processing. Our goal is different than the standard sentiment ana ...","2. Detect & Describe: Deep learning of bank stress in the news 0.969  Tasks: Methods: Datasets: News is a pertinent source of information on financial risks and stress factors, which nevertheless is challenging to harness due to the sparse and unstructured nature of natural text. We propose an a ..."
"3. Earnings Prediction with Deep Learning 0.765  Tasks: Methods: Convolution  Datasets: In the financial sector, a reliable forecast the future financial performance of a company is of great importance for investors' investment decisions. In this paper we compare long-term short-term mem ...",3. Deep learning bank distress from news and numerical financial data 0.979  Tasks: Methods: Datasets: In this paper we focus our attention on the exploitation of the information contained in financial news to enhance the performance of a classifier of bank distress. Such information should be analyzed ...,"3. Mining Public Opinion on Twitter about Natural Disaster Response Using Machine Learning Techniques 0.977  Tasks: Disaster Response, Sentiment Analysis, Time Series  Methods: Datasets: With the development of the Internet, social media has become an essential channel for posting disaster-related information. Analyzing attitudes hidden in these texts, known as sentiment analysis, is ...","3. Firms Default Prediction with Machine Learning 0.966  Tasks: Methods: Datasets: Academics and practitioners have studied over the years models for predicting firms bankruptcy, using statistical and machine-learning approaches. An earlier sign that a company has financial difficul ..."
4. What You Say and How You Say It Matters: Predicting Stock Volatility Using Verbal and Vocal Cues 0.758  Tasks: Methods: Datasets: Predicting financial risk is an essential task in financial market. Prior research has shown that textual information in a firm{'}s financial statement can be used to predict its stock{'}s risk level. ...,4. Proficiency Comparison of LADTree and REPTree Classifiers for Credit Risk Forecast 0.979  Tasks: Methods: Datasets: Predicting the Credit Defaulter is a perilous task of Financial Industries like Banks. Ascertaining non-payer before giving loan is a significant and conflict-ridden task of the Banker. Classification ...,"4. A personal model of trumpery: Deception detection in a real-world high-stakes setting 0.976  Tasks: Deception Detection  Methods: Datasets: Language use reveals information about who we are and how we feel1-3. One of the pioneers in text analysis, Walter Weintraub, manually counted which types of words people used in medical interviews an ...","4. Bank distress in the news: Describing events through deep learning 0.965  Tasks: Methods: Datasets: While many models are purposed for detecting the occurrence of significant events in financial systems, the task of providing qualitative detail on the developments is not usually as well automated. W ..."
"5. The value of text for small business default prediction: A deep learning approach 0.756  Tasks: Methods: Residual Connection, Attention Dropout, Linear Warmup With Linear Decay, Weight Decay, GELU, Dense Connections, Adam, WordPiece, Softmax, Dropout, Multi-Head Attention, Layer Normalization, Scaled Dot-Product Attention, BERT  Datasets: Compared to consumer lending, Micro, Small and Medium Enterprise (mSME) credit risk modelling is particularly challenging, as, often, the same sources of information are not available. It is, therefor ...","5. The value of text for small business default prediction: A deep learning approach 0.977  Tasks: Methods: Residual Connection, Attention Dropout, Linear Warmup With Linear Decay, Weight Decay, GELU, Dense Connections, Adam, WordPiece, Softmax, Dropout, Multi-Head Attention, Layer Normalization, Scaled Dot-Product Attention, BERT  Datasets: Compared to consumer lending, Micro, Small and Medium Enterprise (mSME) credit risk modelling is particularly challenging, as, often, the same sources of information are not available. It is, therefor ...","5. Top Comment or Flop Comment? Predicting and Explaining User Engagement in Online News Discussions 0.976  Tasks: Methods: Datasets: Comment sections below online news articles enjoy growing popularity among readers. However, the overwhelming number of comments makes it infeasible for the average news consumer to read all of them a ...","5. Modeling Institutional Credit Risk with Financial News 0.964  Tasks: Methods: Datasets: Credit risk management, the practice of mitigating losses by understanding the adequacy of a borrower's capital and loan loss reserves, has long been imperative to any financial institution's long-ter ..."


General purpose,Task-related,Method-related,Dataset-related
"1. Guided Dyna-Q for Mobile Robot Exploration and Navigation 0.811  Tasks: Methods: Datasets: Model-based reinforcement learning (RL) enables an agent to learn world models from trial-and-error experiences toward achieving long-term goals. Automated planning, on the other hand, can be used for ...","1. Interactive Gibson Benchmark: A Benchmark for Interactive Navigation in Cluttered Environments 0.997  Tasks: Robot Navigation  Methods: Datasets: We present Interactive Gibson Benchmark, the first comprehensive benchmark for training and evaluating Interactive Navigation: robot navigation strategies where physical interaction with objects is al ...","1. TPO: TREE SEARCH POLICY OPTIMIZATION FOR CONTINUOUS ACTION SPACES 0.989  Tasks: Methods: Entropy Regularization, PPO  Datasets: Monte Carlo Tree Search (MCTS) has achieved impressive results on a range of discrete environments, such as Go, Mario and Arcade games, but it has not yet fulfilled its true potential in continuous do ...","1. Interactive Gibson Benchmark: A Benchmark for Interactive Navigation in Cluttered Environments 0.980  Tasks: Robot Navigation  Methods: Datasets: We present Interactive Gibson Benchmark, the first comprehensive benchmark for training and evaluating Interactive Navigation: robot navigation strategies where physical interaction with objects is al ..."
"2. APPLD: Adaptive Planner Parameter Learning from Demonstration 0.811  Tasks: Robot Navigation  Methods: Datasets: Existing autonomous robot navigation systems allow robots to move from one point to another in a collision-free manner. However, when facing new environments, these systems generally require re-tuning ...","2. L2B: Learning to Balance the Safety-Efficiency Trade-off in Interactive Crowd-aware Robot Navigation 0.995  Tasks: Robot Navigation  Methods: Datasets: This work presents a deep reinforcement learning framework for interactive navigation in a crowded place. Our proposed approach, Learning to Balance (L2B) framework enables mobile robot agents to stee ...","2. Policy Optimization with Model-based Explorations 0.988  Tasks: Atari Games, Decision Making  Methods: Entropy Regularization, PPO  Datasets: Model-free reinforcement learning methods such as the Proximal Policy Optimization algorithm (PPO) have successfully applied in complex decision-making problems such as Atari games. However, these met ...","2. Counterfactual Reasoning about Intent for Interactive Navigation in Dynamic Environments 0.979  Tasks: Decision Making, Motion Planning, Robot Navigation, Visual Tracking  Methods: Datasets: Many modern robotics applications require robots to function autonomously in dynamic environments including other decision making agents, such as people or other robots. This calls for fast and scalab ..."
"3. ReLMoGen: Leveraging Motion Generation in Reinforcement Learning for Mobile Manipulation 0.810  Tasks: Continuous Control, Hierarchical Reinforcement Learning  Methods: Datasets: Many Reinforcement Learning (RL) approaches use joint control signals (positions, velocities, torques) as action space for continuous control tasks. We propose to lift the action space to a higher lev ...","3. ReLMoGen: Leveraging Motion Generation in Reinforcement Learning for Mobile Manipulation 0.995  Tasks: Continuous Control, Hierarchical Reinforcement Learning  Methods: Datasets: Many Reinforcement Learning (RL) approaches use joint control signals (positions, velocities, torques) as action space for continuous control tasks. We propose to lift the action space to a higher lev ...","3. Towards Model-based Reinforcement Learning for Industry-near Environments 0.988  Tasks: Q-Learning  Methods: AutoEncoder, Entropy Regularization, PPO  Datasets: Deep reinforcement learning has over the past few years shown great potential in learning near-optimal control in complex simulated environments with little visible information. Rainbow (Q-Learning) a ...","3. DeFINE: Delayed Feedback based Immersive Navigation Environment for Studying Goal-Directed Human Navigation 0.979  Tasks: Methods: Datasets: With the advent of consumer-grade products for presenting an immersive virtual environment (VE), there is a growing interest in utilizing VEs for testing human navigation behavior. However, preparing ..."
"4. Motion Planner Augmented Reinforcement Learning for Robot Manipulation in Obstructed Environments 0.794  Tasks: Methods: Datasets: Deep reinforcement learning (RL) agents are able to learn contact-rich manipulation tasks by maximizing a reward signal, but require large amounts of experience, especially in environments with many o ...","4. The StreetLearn Environment and Dataset 0.986  Tasks: Decision Making  Methods: Datasets: Navigation is a rich and well-grounded problem domain that drives progress in many different areas of research: perception, planning, memory, exploration, and optimisation in particular. Historically ...","4. Queueing Network Controls via Deep Reinforcement Learning 0.987  Tasks: Methods: Entropy Regularization, PPO  Datasets: Novel advanced policy gradient (APG) methods, such as Trust Region policy optimization and Proximal policy optimization (PPO), have become the dominant reinforcement learning algorithms because of the ...","4. MINOS: Multimodal Indoor Simulator for Navigation in Complex Environments 0.978  Tasks: Methods: Datasets: We present MINOS, a simulator designed to support the development of multisensory models for goal-directed navigation in complex indoor environments. The simulator leverages large datasets of complex ..."
5. Human-Interactive Subgoal Supervision for Efficient Inverse Reinforcement Learning 0.789  Tasks: Methods: Datasets: Humans are able to understand and perform complex tasks by strategically structuring the tasks into incremental steps or subgoals. For a robot attempting to learn to perform a sequential task with cri ...,5. Sim-to-Real Transfer with Incremental Environment Complexity for Reinforcement Learning of Depth-Based Robot Navigation 0.985  Tasks: Robot Navigation  Methods: Datasets: Transferring learning-based models to the real world remains one of the hardest problems in model-free control theory. Due to the cost of data collection on a real robot and the limited sample efficie ...,"5. Optimization and passive flow control using single-step deep reinforcement learning 0.987  Tasks: Methods: Entropy Regularization, PPO  Datasets: This research gauges the ability of deep reinforcement learning (DRL) techniques to assist the optimization and control of fluid mechanical systems. It combines a novel, ""degenerate"" version of the pr ...","5. L2B: Learning to Balance the Safety-Efficiency Trade-off in Interactive Crowd-aware Robot Navigation 0.977  Tasks: Robot Navigation  Methods: Datasets: This work presents a deep reinforcement learning framework for interactive navigation in a crowded place. Our proposed approach, Learning to Balance (L2B) framework enables mobile robot agents to stee ..."


General purpose,Task-related,Method-related,Dataset-related
"1. Convolutional LSTM Network: A Machine Learning Approach for Precipitation Nowcasting 0.852  Tasks: Weather Forecasting  Methods: Convolution, ConvLSTM, Sigmoid Activation, Tanh Activation, LSTM  Datasets: The goal of precipitation nowcasting is to predict the future rainfall intensity in a local region over a relatively short period of time. Very few previous studies have examined this crucial and chal ...",1. Statistical post-processing of wind speed forecasts using convolutional neural networks 0.998  Tasks: Weather Forecasting  Methods: Datasets: Current statistical post-processing methods for probabilistic weather forecasting are not capable of using full spatial patterns from the numerical weather prediction (NWP) model. In this paper we inc ...,"1. Statistical Downscaling of Temperature Distributions from the Synoptic Scale to the Mesoscale Using Deep Convolutional Neural Networks 0.980  Tasks: Methods: Datasets: Deep learning, particularly convolutional neural networks for image recognition, has been recently used in meteorology. One of the promising applications is developing a statistical surrogate model th ...","1. A framework for probabilistic weather forecast post-processing across models and lead times using machine learning 0.983  Tasks: Decision Making  Methods: Datasets: Forecasting the weather is an increasingly data intensive exercise. Numerical Weather Prediction (NWP) models are becoming more complex, with higher resolutions, and there are increasing numbers of di ..."
"2. Spatio-Temporal Graph Convolutional Networks: A Deep Learning Framework for Traffic Forecasting 0.834  Tasks: Time Series, Time Series Prediction, Traffic Prediction  Methods: Datasets: METR-LA, PeMS-M  Timely accurate traffic forecast is crucial for urban traffic control and guidance. Due to the high nonlinearity and complexity of traffic flow, traditional methods cannot satisfy the requirements of ...","2. Deep multi-stations weather forecasting: explainable recurrent convolutional neural networks 0.998  Tasks: Weather Forecasting  Methods: Convolution, Sigmoid Activation, Tanh Activation, LSTM  Datasets: Deep learning applied to weather forecasting has started gaining popularity because of the progress achieved by data-driven models. The present paper compares four different deep learning architecture ...","2. Explainable Failure Predictions with RNN Classifiers based on Time Series Data 0.979  Tasks: Time Series  Methods: Datasets: Given key performance indicators collected with fine granularity as time series, our aim is to predict and explain failures in storage environments. Although explainable predictive modeling based on s ...","2. Deep multi-stations weather forecasting: explainable recurrent convolutional neural networks 0.981  Tasks: Weather Forecasting  Methods: Convolution, Sigmoid Activation, Tanh Activation, LSTM  Datasets: Deep learning applied to weather forecasting has started gaining popularity because of the progress achieved by data-driven models. The present paper compares four different deep learning architecture ..."
"3. Deep multi-stations weather forecasting: explainable recurrent convolutional neural networks 0.832  Tasks: Weather Forecasting  Methods: Convolution, Sigmoid Activation, Tanh Activation, LSTM  Datasets: Deep learning applied to weather forecasting has started gaining popularity because of the progress achieved by data-driven models. The present paper compares four different deep learning architecture ...","3. Weather Forecasting Error in Solar Energy Forecasting 0.998  Tasks: Weather Forecasting  Methods: Datasets: As renewable distributed energy resources (DERs) penetrate the power grid at an accelerating speed, it is essential for operators to have accurate solar photovoltaic (PV) energy forecasting for effici ...","3. Physics Guided Recurrent Neural Networks For Modeling Dynamical Systems: Application to Monitoring Water Temperature And Quality In Lakes 0.979  Tasks: Methods: Datasets: In this paper, we introduce a novel framework for combining scientific knowledge within physics-based models and recurrent neural networks to advance scientific discovery in many dynamical systems. We ...","3. Neural networks for post-processing ensemble weather forecasts 0.981  Tasks: Methods: Datasets: Ensemble weather predictions require statistical post-processing of systematic errors to obtain reliable and accurate probabilistic forecasts. Traditionally, this is accomplished with distributional r ..."
"4. Precipitation Nowcasting: Leveraging bidirectional LSTM and 1D CNN 0.826  Tasks: Time Series, Time Series Forecasting, Weather Forecasting  Methods: Sigmoid Activation, Tanh Activation, LSTM  Datasets: Short-term rainfall forecasting, also known as precipitation nowcasting has become a potentially fundamental technology impacting significant real-world applications ranging from flight safety, rainst ...",4. Improving data-driven global weather prediction using deep convolutional neural networks on a cubed sphere 0.998  Tasks: Weather Forecasting  Methods: Convolution  Datasets: We present a significantly-improved data-driven global weather forecasting framework using a deep convolutional neural network (CNN) to forecast several basic atmospheric variables on a global grid. N ...,"4. STFNets: Learning Sensing Signals from the Time-Frequency Perspective with Short-Time Fourier Neural Networks 0.978  Tasks: Speech Recognition  Methods: Datasets: Recent advances in deep learning motivate the use of deep neural networks in Internet-of-Things (IoT) applications. These networks are modelled after signal processing in the human brain, thereby lead ...","4. WeatherBench: A benchmark dataset for data-driven weather forecasting 0.981  Tasks: Weather Forecasting  Methods: Linear Regression  Datasets: Data-driven approaches, most prominently deep learning, have become powerful tools for prediction in many domains. A natural question to ask is whether data-driven methods could also be used to predic ..."
"5. Diffusion Convolutional Recurrent Neural Network: Data-Driven Traffic Forecasting 0.815  Tasks: Multivariate Time Series Forecasting, Spatio-Temporal Forecasting, Time Series, Time Series Forecasting, Time Series Prediction, Traffic Prediction  Methods: Datasets: METR-LA, PeMS-M  Spatiotemporal forecasting has various applications in neuroscience, climate and transportation domain. Traffic forecasting is one canonical example of such learning task. The task is challenging due ...","5. Detecting Comma-shaped Clouds for Severe Weather Forecasting using Shape and Motion 0.998  Tasks: Weather Forecasting  Methods: Datasets: Meteorologists use shapes and movements of clouds in satellite images as indicators of several major types of severe storms. Satellite imaginary data are in increasingly higher resolution, both spatia ...","5. Correlated Time Series Forecasting using Deep Neural Networks: A Summary of Results 0.978  Tasks: Multi-Task Learning, Time Series, Time Series Forecasting  Methods: Datasets: Cyber-physical systems often consist of entities that interact with each other over time. Meanwhile, as part of the continued digitization of industrial processes, various sensor technologies are depl ...","5. Smart Weather Forecasting Using Machine Learning:A Case Study in Tennessee 0.980  Tasks: Weather Forecasting  Methods: Datasets: Traditionally, weather predictions are performed with the help of large complex models of physics, which utilize different atmospheric conditions over a long period of time. These conditions are often ..."
