<a href="https://colab.research.google.com/github/hunkim/ACL-2020-Papers/blob/master/generate_paper_list_with_arxiv_link.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Load Paper List

In [0]:
def read_papers(path):
    """Read a paper list from a UTF-8 text file of blank-line-separated records.

    Every record consists of exactly two non-empty lines: the paper title
    followed by the author list. Any run of blank (or whitespace-only) lines
    acts as a single separator, so leading, trailing, or doubled blank lines
    do not create empty records.

    Args:
        path: Path of the text file to read.

    Returns:
        A list of ``[title, authors]`` lists, in file order. An empty file
        yields an empty list.

    Raises:
        AssertionError: If a record does not have exactly two lines.
    """
    papers = []
    record = []
    with open(path, "r", encoding="utf-8") as f:
        for line in f:
            line = line.strip()
            if line:
                record.append(line)
            elif record:
                # A blank line closes the current record; extra blank lines
                # are ignored because `record` is already empty.
                papers.append(record)
                record = []
    if record:
        # The last record is not necessarily followed by a blank line.
        papers.append(record)

    for index, p in enumerate(papers):
        if len(p) != 2:
            # Raised explicitly (instead of a bare `assert`) so the check
            # survives `python -O` and reports which record is malformed.
            raise AssertionError(
                f"record {index} in {path} has {len(p)} line(s), "
                f"expected title and authors: {p!r}"
            )
    return papers

In [2]:
# Load the long-paper list; each entry is a [title, authors] pair.
longp = read_papers("./data/long.txt")
longp[:3]  # preview the first three entries

[['2kenize: Tying Subword Sequences for Chinese Script Conversion',
  'Pranav A and Isabelle Augenstein'],
 ['A Batch Normalized Inference Network Keeps the KL Vanishing Away',
  'Qile Zhu, Wei Bi, Xiaojiang Liu, Xiyao Ma, Xiaolin Li and Dapeng Wu'],
 ['A Call for More Rigor in Unsupervised Cross-lingual Learning',
  'Mikel Artetxe, Sebastian Ruder, Dani Yogatama, Gorka Labaka and Eneko Agirre']]

In [3]:
# Number of long papers loaded.
len(longp)

571

In [4]:
# Load the short-paper list; each entry is a [title, authors] pair.
short = read_papers("./data/short.txt")
short[:3]  # preview the first three entries

[['A Complete Shift-Reduce Chinese Discourse Parser with Robust Dynamic Oracle',
  'Shyh-Shiun Hung, Hen-Hsen Huang and Hsin-Hsi Chen'],
 ['A Diverse Corpus for Evaluating and Developing English Math Word Problem Solvers',
  'Shen-yun Miao, Chao-Chun Liang and Keh-Yih Su'],
 ['A Frame-based Sentence Representation for Machine Reading Comprehension',
  'Shaoru Guo, Ru Li, Hongye Tan, Xiaoli Li, Yong Guan, Hongyan Zhao and Yueping Zhang']]

In [5]:
# Number of short papers loaded.
len(short)

208

In [6]:
# Load the system-demonstration paper list; each entry is a [title, authors] pair.
demop = read_papers("./data/demo.txt")
demop[:3]  # preview the first three entries

[['ADVISER: A Toolkit for Developing Multi-modal, Multi-domain and Socially-engaged Conversational Agents',
  'Chia-Yu Li, Daniel Ortega, Dirk Väth, Florian Lux, Lindsey Vanderlyn, Maximilian Schmidt, Michael Neumann, Moritz Völkel, Pavel Denisov, Sabrina Jenne, Zorica Kacarevic and Ngoc Thang Vu'],
 ['BENTO: A Visual Platform for Building Clinical NLP Pipelines Based on CodaLab',
  'Yonghao Jin, Fei Li and Hong Yu'],
 ['Clinical-Coder: Assigning Interpretable ICD-10 Codes to Chinese Clinical Notes',
  'Pengfei Cao, Chenwei Yan, xiangling fu, Yubo Chen, Kang Liu, Jun Zhao, Shengping Liu and Weifeng Chong']]

In [7]:
# Number of demo papers loaded.
len(demop)

43

In [8]:
# Load the student-workshop paper list; each entry is a [title, authors] pair.
student = read_papers("./data/student.txt")
student[:3]  # preview the first three entries

[['#NotAWhore! A Computational Linguistic Perspective of Rape Culture and Victimization on Social Media',
  'Ashima Suvarna and Grusha Bhalla'],
 ['A Geometry-Inspired Attack for Generating Natural Language Adversarial Examples',
  'Zhao Meng and Roger Wattenhofer'],
 ['A Simple and Effective Dependency parser for Telugu',
  'Sneha Nallani, Manish Shrivastava and Dipti Sharma']]

In [9]:
# Number of student-workshop papers loaded.
len(student)

49

# Grouping Papers by Topic



In [10]:
import gensim
from gensim.utils import simple_preprocess
from gensim.parsing.preprocessing import STOPWORDS
from nltk.stem import WordNetLemmatizer, SnowballStemmer
from nltk.stem.porter import *
import numpy as np
import nltk

# Download the WordNet corpus used by WordNetLemmatizer below
# (reported as already up-to-date when it is present locally).
nltk.download('wordnet')
# Shared English Snowball stemmer, read as a global by lemmatize_stemming().
stemmer = SnowballStemmer("english")

def lemmatize_stemming(text):
  """Lemmatize a single token as a verb, then stem the lemma.

  Uses a fresh WordNetLemmatizer for the lemma and the module-level
  `stemmer` for the final stem, which is returned.
  """
  verb_lemma = WordNetLemmatizer().lemmatize(text, pos='v')
  return stemmer.stem(verb_lemma)

# Tokenize and lemmatize
def preprocess(text):
  """Tokenize `text` and return the lemmatized, stemmed form of each kept token.

  Tokens come from gensim's `simple_preprocess`; a token is kept only when it
  is not a gensim stopword and is longer than three characters.
  """
  stopwords = gensim.parsing.preprocessing.STOPWORDS
  return [
    lemmatize_stemming(word)
    for word in gensim.utils.simple_preprocess(text)
    if word not in stopwords and len(word) > 3
  ]




[nltk_data] Downloading package wordnet to /root/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!


In [0]:
#FIXME: Better way to get human readable topic names from LDA topics?
def list2topiclist(list, num_topics = 8, random_state = None):
  """Group papers by their dominant LDA topic.

  An LDA model is fitted on the preprocessed paper titles. Each topic is
  labelled with its three highest-weighted terms joined by spaces, and each
  paper is assigned to the topic with the highest probability for its title.

  Args:
    list: Re-iterable sequence of papers; element 0 of each paper is the
      title. (The name shadows the builtin but is kept for compatibility
      with existing callers.)
    num_topics: Number of LDA topics to fit.
    random_state: Optional seed forwarded to `gensim.models.LdaModel` so
      that the grouping is reproducible. `None` keeps the unseeded behaviour.

  Returns:
    A dict mapping topic title -> list of papers (the original elements of
    `list`). Topics that receive no paper are absent; topics whose titles
    coincide share one entry. Empty input yields an empty dict.
  """
  if not list:
    # Nothing to model; LDA cannot be fitted on an empty corpus.
    return {}

  processed_docs = [preprocess(line[0]) for line in list]

  # Build the vocabulary and the bag-of-words corpus once, after all titles
  # have been tokenized (rebuilding them per title is quadratic).
  dictionary = gensim.corpora.Dictionary(processed_docs)
  bow_corpus = [dictionary.doc2bow(doc) for doc in processed_docs]

  lda = gensim.models.LdaModel(bow_corpus, num_topics,
                               id2word = dictionary, passes = 10,
                               random_state = random_state)

  def get_topic_title(idx, topn=3):
    # Human-readable label: the topic's `topn` highest-weighted terms.
    topn_terms = [dictionary[x[0]] for x in lda.get_topic_terms(idx, topn)]
    return " ".join(topn_terms)

  # Create topic title
  list_topic_titles = [get_topic_title(i) for i in range(num_topics)]

  # Assign list to topic
  topic_dict = {}
  for line, bow_vector in zip(list, bow_corpus):
    # bow_corpus[i] is the bag-of-words of list[i], so the titles do not
    # need to be preprocessed a second time. max() returns the first
    # highest-probability topic, matching a stable descending sort.
    best_topic_id, _ = max(lda.get_document_topics(bow_vector),
                           key=lambda tup: tup[1])
    topic_dict.setdefault(list_topic_titles[best_topic_id], []).append(line)

  return topic_dict
      


In [12]:
# Smoke test: group the demo papers by topic and print the generated topic titles.
# NOTE(review): print(demop) dumps the entire list; consider demop[:3] to keep the output short.
print(demop)
topics = list2topiclist(demop)
for topic in topics:
  print(topic)

[['ADVISER: A Toolkit for Developing Multi-modal, Multi-domain and Socially-engaged Conversational Agents', 'Chia-Yu Li, Daniel Ortega, Dirk Väth, Florian Lux, Lindsey Vanderlyn, Maximilian Schmidt, Michael Neumann, Moritz Völkel, Pavel Denisov, Sabrina Jenne, Zorica Kacarevic and Ngoc Thang Vu'], ['BENTO: A Visual Platform for Building Clinical NLP Pipelines Based on CodaLab', 'Yonghao Jin, Fei Li and Hong Yu'], ['Clinical-Coder: Assigning Interpretable ICD-10 Codes to Chinese Clinical Notes', 'Pengfei Cao, Chenwei Yan, xiangling fu, Yubo Chen, Kang Liu, Jun Zhao, Shengping Liu and Weifeng Chong'], ['CLIReval: Evaluating Machine Translation as a Cross-Lingual Information Retrieval Task', 'Shuo Sun, Suzanna Sia and Kevin Duh'], ['Conversation Learner - A Machine Teaching Tool for Building Dialog Managers for Task-Oriented Dialog Systems', 'Swadheen Shukla, Lars Liden, Shahin Shayandeh, Eslam Kamal, Jinchao Li, Matt Mazzola, Thomas Park, Baolin Peng and Jianfeng Gao'], ['ConvLab-2: An O

# Search arXiv Link

In [0]:
import time
import urllib
import urllib.error
import urllib.request
from difflib import SequenceMatcher

from bs4 import BeautifulSoup
from googlesearch import search
from tqdm import tqdm

def similarity(a, b):
    """Return the difflib similarity ratio of `a` and `b` (1.0 means identical)."""
    matcher = SequenceMatcher(a=a, b=b)
    return matcher.ratio()


def search_arxiv_link(title):
    """Find the arXiv abstract page for a paper title via a Google search.

    Only the first search result is inspected (`stop=1`). A result is accepted
    when it is an ``arxiv.org/abs`` URL and the title of the fetched page,
    with its first whitespace-separated token dropped, has a similarity above
    0.8 to `title`. The comparison is case-insensitive.

    Args:
        title: Paper title to search for.

    Returns:
        The matching arXiv URL, or None when no result matched or the arXiv
        page could not be fetched or has no <title>.
    """
    link = None
    wanted = title.lower()
    for j in search(title, tld="co.in", num=10, stop=1, pause=1.0, user_agent="acl2020"):
        if 'arxiv.org/abs' not in j:
            continue

        try:
            # Close the HTTP response deterministically; BeautifulSoup reads
            # the whole body while the response is still open.
            with urllib.request.urlopen(j) as thepage:
                soup = BeautifulSoup(thepage, "html.parser")
        except urllib.error.URLError as err:
            # One unreachable arXiv page should not abort the whole run;
            # report it and treat the result as not found.
            print("FETCH FAILED")
            print(j)
            print(err)
            continue

        if soup.title is None:
            # Page without a <title> element: nothing to compare against.
            continue

        # Drop the first token of the page title before comparing
        # (presumably the "[arXiv id]" prefix — confirm against arXiv pages).
        searched_title = ' '.join(soup.title.text.lower().split()[1:])
        if similarity(wanted, searched_title) > 0.8:
            link = j
            break

        print("NOT MATCHED")
        print(title)
        print(searched_title)
    return link

In [0]:
def generate_paper_list_with_arxiv_link(f, papers):
    """Write `papers` to `f` as a markdown bullet list, then a blank line.

    Each paper is a (title, authors) pair. The lower-cased title is looked up
    with `search_arxiv_link`; when a link is found it is appended to the
    bullet as an ``[[arXiv]](url)`` link. A tqdm progress bar tracks the loop.
    """
    for title, _authors in tqdm(papers):
        arxiv_url = search_arxiv_link(title.lower())
        if arxiv_url:
            entry = f"- {title} [[arXiv]]({arxiv_url})\n"
        else:
            entry = f"- {title}\n"
        f.write(entry)
    f.write("\n")

In [0]:
def generate_paper_list_with_arxiv_link_topic(f, papers):
  """Write `papers` to `f` grouped by topic.

  The papers are grouped with `list2topiclist`; every group is emitted as a
  ``### <topic>`` markdown heading followed by its bullet list.
  """
  grouped = list2topiclist(papers)
  for heading, members in grouped.items():
    f.write(f"### {heading}\n")
    generate_paper_list_with_arxiv_link(f, members)


In [19]:
# Write the final markdown file: one "##" section per paper category, each
# grouped by topic. The encoding is explicit because titles may contain
# non-ASCII characters and the input lists are read as UTF-8.
sections = [
  ("Long Papers", longp),
  ("Short Papers", short),
  ("System Demonstrations", demop),
  ("Student Research Workshop", student),
]
with open("papers_with_arxiv_link_topic.md", "w", encoding="utf-8") as f:
  for heading, section_papers in sections:
    f.write(f"## {heading}\n\n")
    generate_paper_list_with_arxiv_link_topic(f, section_papers)



  0%|          | 0/69 [00:00<?, ?it/s][A
  1%|▏         | 1/69 [00:02<02:36,  2.30s/it][A
  3%|▎         | 2/69 [00:04<02:30,  2.24s/it][A
  4%|▍         | 3/69 [00:06<02:23,  2.17s/it][A
  6%|▌         | 4/69 [00:08<02:21,  2.18s/it][A
  7%|▋         | 5/69 [00:10<02:17,  2.15s/it][A
  9%|▊         | 6/69 [00:12<02:12,  2.10s/it][A
 10%|█         | 7/69 [00:15<02:18,  2.24s/it][A
 12%|█▏        | 8/69 [00:17<02:19,  2.28s/it][A
 13%|█▎        | 9/69 [00:19<02:15,  2.25s/it][A
 14%|█▍        | 10/69 [00:21<02:10,  2.21s/it][A
 16%|█▌        | 11/69 [00:24<02:06,  2.18s/it][A
 17%|█▋        | 12/69 [00:25<01:59,  2.10s/it][A
 19%|█▉        | 13/69 [00:27<01:55,  2.06s/it][A
 20%|██        | 14/69 [00:30<01:54,  2.09s/it][A
 22%|██▏       | 15/69 [00:32<01:53,  2.10s/it][A
 23%|██▎       | 16/69 [00:34<01:49,  2.07s/it][A
 25%|██▍       | 17/69 [00:36<01:46,  2.05s/it][A
 26%|██▌       | 18/69 [00:38<01:45,  2.07s/it][A
 28%|██▊       | 19/69 [00:40<01:48,  2.17s/it]

NOT MATCHED
zero-shot text classification via reinforced self-training
integrating semantic knowledge to tackle zero-shot text classification



 99%|█████████▊| 68/69 [02:28<00:02,  2.31s/it][A
100%|██████████| 69/69 [02:30<00:00,  2.18s/it]

  0%|          | 0/73 [00:00<?, ?it/s][A
  1%|▏         | 1/73 [00:02<02:56,  2.45s/it][A
  3%|▎         | 2/73 [00:04<02:48,  2.38s/it][A
  4%|▍         | 3/73 [00:06<02:38,  2.26s/it][A
  5%|▌         | 4/73 [00:08<02:29,  2.16s/it][A
  7%|▋         | 5/73 [00:10<02:24,  2.13s/it][A
  8%|▊         | 6/73 [00:12<02:22,  2.12s/it][A
 10%|▉         | 7/73 [00:14<02:17,  2.08s/it][A
 11%|█         | 8/73 [00:17<02:22,  2.19s/it][A

NOT MATCHED
attentive pooling with learnable norms for text representation
attentive pooling networks



 12%|█▏        | 9/73 [00:19<02:21,  2.20s/it][A
 14%|█▎        | 10/73 [00:21<02:19,  2.21s/it][A
 15%|█▌        | 11/73 [00:23<02:16,  2.20s/it][A
 16%|█▋        | 12/73 [00:25<02:11,  2.16s/it][A
 18%|█▊        | 13/73 [00:28<02:10,  2.17s/it][A
 19%|█▉        | 14/73 [00:30<02:06,  2.15s/it][A
 21%|██        | 15/73 [00:32<02:11,  2.27s/it][A
 22%|██▏       | 16/73 [00:34<02:08,  2.25s/it][A
 23%|██▎       | 17/73 [00:37<02:04,  2.23s/it][A

NOT MATCHED
contextualized weak supervision for text classification
weakly-supervised neural text classification



 25%|██▍       | 18/73 [00:39<02:03,  2.25s/it][A
 26%|██▌       | 19/73 [00:41<01:59,  2.22s/it][A
 27%|██▋       | 20/73 [00:43<02:00,  2.27s/it][A
 29%|██▉       | 21/73 [00:46<01:55,  2.21s/it][A
 30%|███       | 22/73 [00:47<01:46,  2.09s/it][A
 32%|███▏      | 23/73 [00:50<01:47,  2.15s/it][A
 33%|███▎      | 24/73 [00:52<01:43,  2.10s/it][A
 34%|███▍      | 25/73 [00:54<01:45,  2.20s/it][A
 36%|███▌      | 26/73 [00:56<01:42,  2.17s/it][A
 37%|███▋      | 27/73 [00:58<01:39,  2.15s/it][A
 38%|███▊      | 28/73 [01:00<01:36,  2.15s/it][A
 40%|███▉      | 29/73 [01:03<01:40,  2.28s/it][A
 41%|████      | 30/73 [01:05<01:35,  2.23s/it][A

NOT MATCHED
explicit semantic decomposition for definition generation
semantic composition and decomposition: from recognition to generation



 42%|████▏     | 31/73 [01:07<01:34,  2.26s/it][A
 44%|████▍     | 32/73 [01:10<01:35,  2.34s/it][A
 45%|████▌     | 33/73 [01:12<01:32,  2.31s/it][A
 47%|████▋     | 34/73 [01:14<01:26,  2.23s/it][A
 48%|████▊     | 35/73 [01:16<01:23,  2.20s/it][A
 49%|████▉     | 36/73 [01:18<01:20,  2.16s/it][A
 51%|█████     | 37/73 [01:21<01:23,  2.33s/it][A
 52%|█████▏    | 38/73 [01:23<01:17,  2.20s/it][A
 53%|█████▎    | 39/73 [01:25<01:16,  2.24s/it][A
 55%|█████▍    | 40/73 [01:27<01:12,  2.20s/it][A
 56%|█████▌    | 41/73 [01:30<01:09,  2.17s/it][A

NOT MATCHED
learning constraints for structured prediction using rectifier networks
adversarial constraint learning for structured prediction



 58%|█████▊    | 42/73 [01:32<01:06,  2.16s/it][A
 59%|█████▉    | 43/73 [01:34<01:06,  2.23s/it][A
 60%|██████    | 44/73 [01:36<01:03,  2.19s/it][A
 62%|██████▏   | 45/73 [01:38<00:59,  2.11s/it][A
 63%|██████▎   | 46/73 [01:40<00:54,  2.03s/it][A
 64%|██████▍   | 47/73 [01:42<00:51,  1.98s/it][A
 66%|██████▌   | 48/73 [01:44<00:50,  2.02s/it][A
 67%|██████▋   | 49/73 [01:46<00:51,  2.13s/it][A
 68%|██████▊   | 50/73 [01:48<00:47,  2.07s/it][A
 70%|██████▉   | 51/73 [01:51<00:47,  2.14s/it][A
 71%|███████   | 52/73 [01:53<00:47,  2.26s/it][A
 73%|███████▎  | 53/73 [01:55<00:45,  2.26s/it][A
 74%|███████▍  | 54/73 [01:58<00:42,  2.24s/it][A
 75%|███████▌  | 55/73 [02:00<00:41,  2.29s/it][A
 77%|███████▋  | 56/73 [02:02<00:37,  2.21s/it][A
 78%|███████▊  | 57/73 [02:04<00:35,  2.21s/it][A
 79%|███████▉  | 58/73 [02:06<00:33,  2.22s/it][A

NOT MATCHED
relation-aware collaborative learning for unified aspect-based sentiment analysis
an interactive multi-task learning network for end-to-end aspect-based sentiment analysis



 81%|████████  | 59/73 [02:09<00:30,  2.21s/it][A
 82%|████████▏ | 60/73 [02:11<00:28,  2.18s/it][A
 84%|████████▎ | 61/73 [02:13<00:25,  2.13s/it][A
 85%|████████▍ | 62/73 [02:15<00:23,  2.13s/it][A
 86%|████████▋ | 63/73 [02:17<00:21,  2.12s/it][A
 88%|████████▊ | 64/73 [02:19<00:19,  2.16s/it][A
 89%|████████▉ | 65/73 [02:22<00:18,  2.34s/it][A

NOT MATCHED
spanmlt: a span-based multi-task learning framework for pair-wise aspect and opinion terms extraction
an interactive multi-task learning network for end-to-end aspect-based sentiment analysis



 90%|█████████ | 66/73 [02:24<00:16,  2.30s/it][A
 92%|█████████▏| 67/73 [02:26<00:13,  2.22s/it][A
 93%|█████████▎| 68/73 [02:28<00:11,  2.20s/it][A
 95%|█████████▍| 69/73 [02:30<00:08,  2.15s/it][A
 96%|█████████▌| 70/73 [02:33<00:06,  2.17s/it][A
 97%|█████████▋| 71/73 [02:35<00:04,  2.21s/it][A
 99%|█████████▊| 72/73 [02:37<00:02,  2.16s/it][A
100%|██████████| 73/73 [02:39<00:00,  2.19s/it]

  0%|          | 0/71 [00:00<?, ?it/s][A
  1%|▏         | 1/71 [00:02<02:50,  2.43s/it][A
  3%|▎         | 2/71 [00:04<02:42,  2.35s/it][A
  4%|▍         | 3/71 [00:06<02:34,  2.28s/it][A
  6%|▌         | 4/71 [00:09<02:34,  2.31s/it][A
  7%|▋         | 5/71 [00:11<02:29,  2.26s/it][A
  8%|▊         | 6/71 [00:13<02:24,  2.22s/it][A
 10%|▉         | 7/71 [00:15<02:23,  2.24s/it][A
 11%|█▏        | 8/71 [00:18<02:23,  2.28s/it][A
 13%|█▎        | 9/71 [00:20<02:17,  2.22s/it][A
 14%|█▍        | 10/71 [00:21<02:09,  2.12s/it][A
 15%|█▌        | 11/71 [00:23<02:05,  2.09s/it][A

NOT MATCHED
curriculum learning for natural language understanding
visualizing and understanding curriculum learning for long short-term memory networks



 23%|██▎       | 16/71 [00:35<02:04,  2.27s/it][A
 24%|██▍       | 17/71 [00:37<02:00,  2.22s/it][A
 25%|██▌       | 18/71 [00:39<01:54,  2.16s/it][A

NOT MATCHED
distilling annotations via active imitation learning
random expert distillation: imitation learning via expert policy support estimation



 27%|██▋       | 19/71 [00:41<01:48,  2.08s/it][A
 28%|██▊       | 20/71 [00:43<01:46,  2.09s/it][A
 30%|██▉       | 21/71 [00:45<01:45,  2.11s/it][A
 31%|███       | 22/71 [00:48<01:48,  2.21s/it][A
 32%|███▏      | 23/71 [00:50<01:46,  2.22s/it][A
 34%|███▍      | 24/71 [00:52<01:43,  2.19s/it][A
 35%|███▌      | 25/71 [00:54<01:37,  2.13s/it][A
 37%|███▋      | 26/71 [00:56<01:35,  2.12s/it][A
 38%|███▊      | 27/71 [00:59<01:39,  2.27s/it][A
 39%|███▉      | 28/71 [01:01<01:36,  2.24s/it][A
 41%|████      | 29/71 [01:03<01:35,  2.27s/it][A
 42%|████▏     | 30/71 [01:05<01:31,  2.23s/it][A
 44%|████▎     | 31/71 [01:07<01:26,  2.16s/it][A
 45%|████▌     | 32/71 [01:10<01:28,  2.27s/it][A
 46%|████▋     | 33/71 [01:12<01:25,  2.25s/it][A
 48%|████▊     | 34/71 [01:14<01:20,  2.17s/it][A
 49%|████▉     | 35/71 [01:16<01:17,  2.16s/it][A

NOT MATCHED
improving disentangled text representation learning with information-theoretic guidance
improving disentangled representation learning with the beta bernoulli process



 51%|█████     | 36/71 [01:19<01:17,  2.20s/it][A
 52%|█████▏    | 37/71 [01:21<01:13,  2.18s/it][A
 54%|█████▎    | 38/71 [01:23<01:10,  2.15s/it][A
 55%|█████▍    | 39/71 [01:25<01:07,  2.09s/it][A
 56%|█████▋    | 40/71 [01:27<01:02,  2.02s/it][A
 58%|█████▊    | 41/71 [01:29<01:01,  2.05s/it][A
 59%|█████▉    | 42/71 [01:31<01:00,  2.08s/it][A
 61%|██████    | 43/71 [01:33<00:58,  2.09s/it][A
 62%|██████▏   | 44/71 [01:35<00:55,  2.07s/it][A
 63%|██████▎   | 45/71 [01:37<00:52,  2.02s/it][A
 65%|██████▍   | 46/71 [01:39<00:52,  2.11s/it][A
 66%|██████▌   | 47/71 [01:41<00:50,  2.12s/it][A
 68%|██████▊   | 48/71 [01:44<00:49,  2.13s/it][A
 69%|██████▉   | 49/71 [01:46<00:47,  2.14s/it][A
 70%|███████   | 50/71 [01:48<00:44,  2.13s/it][A
 72%|███████▏  | 51/71 [01:50<00:41,  2.09s/it][A
 73%|███████▎  | 52/71 [01:52<00:41,  2.16s/it][A
 75%|███████▍  | 53/71 [01:54<00:38,  2.14s/it][A
 76%|███████▌  | 54/71 [01:56<00:36,  2.14s/it][A
 77%|███████▋  | 55/71 [01:58<

NOT MATCHED
bilingual dictionary based neural machine translation without using parallel sentences
bridging neural machine translation and bilingual dictionaries



 15%|█▌        | 10/66 [00:21<01:57,  2.10s/it][A
 17%|█▋        | 11/66 [00:23<01:52,  2.05s/it][A
 18%|█▊        | 12/66 [00:25<01:48,  2.01s/it][A
 20%|█▉        | 13/66 [00:27<01:47,  2.03s/it][A
 21%|██        | 14/66 [00:29<01:47,  2.07s/it][A
 23%|██▎       | 15/66 [00:31<01:49,  2.14s/it][A
 24%|██▍       | 16/66 [00:34<01:50,  2.20s/it][A
 26%|██▌       | 17/66 [00:36<01:46,  2.17s/it][A
 27%|██▋       | 18/66 [00:38<01:41,  2.11s/it][A
 29%|██▉       | 19/66 [00:40<01:35,  2.04s/it][A
 30%|███       | 20/66 [00:42<01:35,  2.07s/it][A
 32%|███▏      | 21/66 [00:44<01:37,  2.17s/it][A
 33%|███▎      | 22/66 [00:46<01:35,  2.17s/it][A
 35%|███▍      | 23/66 [00:48<01:32,  2.14s/it][A
 36%|███▋      | 24/66 [00:51<01:30,  2.16s/it][A
 38%|███▊      | 25/66 [00:53<01:26,  2.11s/it][A
 39%|███▉      | 26/66 [00:55<01:26,  2.15s/it][A

NOT MATCHED
graph neural news recommendation with unsupervised preference disentanglement
graph neural news recommendation with long-term and short-term interest modeling



 41%|████      | 27/66 [00:57<01:22,  2.13s/it][A
 42%|████▏     | 28/66 [00:59<01:19,  2.10s/it][A
 44%|████▍     | 29/66 [01:01<01:17,  2.11s/it][A
 45%|████▌     | 30/66 [01:03<01:14,  2.07s/it][A
 47%|████▋     | 31/66 [01:05<01:14,  2.14s/it][A
 48%|████▊     | 32/66 [01:07<01:11,  2.10s/it][A
 50%|█████     | 33/66 [01:10<01:18,  2.37s/it][A
 52%|█████▏    | 34/66 [01:12<01:10,  2.21s/it][A
 53%|█████▎    | 35/66 [01:14<01:06,  2.15s/it][A
 55%|█████▍    | 36/66 [01:16<01:02,  2.07s/it][A
 56%|█████▌    | 37/66 [01:18<01:00,  2.07s/it][A
 58%|█████▊    | 38/66 [01:20<00:58,  2.09s/it][A
 59%|█████▉    | 39/66 [01:22<00:55,  2.06s/it][A
 61%|██████    | 40/66 [01:24<00:54,  2.10s/it][A
 62%|██████▏   | 41/66 [01:27<00:53,  2.13s/it][A
 64%|██████▎   | 42/66 [01:29<00:50,  2.10s/it][A
 65%|██████▌   | 43/66 [01:31<00:48,  2.11s/it][A
 67%|██████▋   | 44/66 [01:33<00:45,  2.07s/it][A
 68%|██████▊   | 45/66 [01:35<00:46,  2.21s/it][A
 70%|██████▉   | 46/66 [01:37<

NOT MATCHED
unknown intent detection using gaussian mixture model with an application to zero-shot intent classification
zero-shot user intent detection via capsule neural networks



  1%|▏         | 1/74 [00:02<02:31,  2.08s/it][A
  3%|▎         | 2/74 [00:04<02:33,  2.14s/it][A
  4%|▍         | 3/74 [00:06<02:24,  2.03s/it][A
  5%|▌         | 4/74 [00:08<02:26,  2.09s/it][A
  7%|▋         | 5/74 [00:10<02:23,  2.09s/it][A

NOT MATCHED
adaptive compression of word embeddings
online embedding compression for text classification using low rank matrix factorization



  8%|▊         | 6/74 [00:12<02:20,  2.07s/it][A
  9%|▉         | 7/74 [00:14<02:18,  2.07s/it][A
 11%|█         | 8/74 [00:18<02:49,  2.56s/it][A
 12%|█▏        | 9/74 [00:20<02:42,  2.50s/it][A
 14%|█▎        | 10/74 [00:22<02:33,  2.40s/it][A

NOT MATCHED
cross-lingual unsupervised sentiment classification with multi-view transfer learning
multi-source cross-lingual model transfer: learning what to share



 15%|█▍        | 11/74 [00:24<02:26,  2.33s/it][A
 16%|█▌        | 12/74 [00:27<02:24,  2.33s/it][A
 18%|█▊        | 13/74 [00:29<02:16,  2.24s/it][A
 19%|█▉        | 14/74 [00:31<02:09,  2.15s/it][A
 20%|██        | 15/74 [00:33<02:10,  2.21s/it][A
 22%|██▏       | 16/74 [00:36<02:19,  2.40s/it][A
 23%|██▎       | 17/74 [00:38<02:09,  2.28s/it][A
 24%|██▍       | 18/74 [00:41<02:16,  2.43s/it][A
 26%|██▌       | 19/74 [00:43<02:06,  2.30s/it][A
 27%|██▋       | 20/74 [00:45<02:03,  2.29s/it][A
 28%|██▊       | 21/74 [00:47<01:58,  2.24s/it][A
 30%|██▉       | 22/74 [00:50<01:59,  2.30s/it][A
 31%|███       | 23/74 [00:52<01:56,  2.29s/it][A
 32%|███▏      | 24/74 [00:54<01:47,  2.15s/it][A
 34%|███▍      | 25/74 [00:56<01:53,  2.31s/it][A
 35%|███▌      | 26/74 [00:58<01:48,  2.26s/it][A
 36%|███▋      | 27/74 [01:00<01:42,  2.19s/it][A
 38%|███▊      | 28/74 [01:03<01:40,  2.19s/it][A
 39%|███▉      | 29/74 [01:05<01:40,  2.23s/it][A
 41%|████      | 30/74 [01:07<

NOT MATCHED
meta-reinforced multi-domain state generator for dialogue systems
transferable multi-domain state generator for task-oriented dialogue systems



 57%|█████▋    | 42/74 [01:33<01:07,  2.11s/it][A
 58%|█████▊    | 43/74 [01:35<01:05,  2.11s/it][A
 59%|█████▉    | 44/74 [01:37<01:04,  2.13s/it][A
 61%|██████    | 45/74 [01:40<01:04,  2.22s/it][A
 62%|██████▏   | 46/74 [01:42<00:58,  2.09s/it][A
 64%|██████▎   | 47/74 [01:44<01:00,  2.24s/it][A
 65%|██████▍   | 48/74 [01:47<00:59,  2.30s/it][A
 66%|██████▌   | 49/74 [01:49<00:56,  2.28s/it][A
 68%|██████▊   | 50/74 [01:51<00:52,  2.19s/it][A
 69%|██████▉   | 51/74 [01:53<00:50,  2.18s/it][A
 70%|███████   | 52/74 [01:57<00:56,  2.56s/it][A
 72%|███████▏  | 53/74 [01:59<00:50,  2.40s/it][A
 73%|███████▎  | 54/74 [02:01<00:46,  2.34s/it][A
 74%|███████▍  | 55/74 [02:03<00:42,  2.22s/it][A
 76%|███████▌  | 56/74 [02:05<00:39,  2.20s/it][A
 77%|███████▋  | 57/74 [02:07<00:37,  2.19s/it][A
 78%|███████▊  | 58/74 [02:09<00:35,  2.20s/it][A
 80%|███████▉  | 59/74 [02:11<00:32,  2.16s/it][A
 81%|████████  | 60/74 [02:13<00:29,  2.14s/it][A
 82%|████████▏ | 61/74 [02:16<

NOT MATCHED
addressing posterior collapse with mutual information for improved variational neural machine translation
improved variational neural machine translation by promoting mutual information



  6%|▌         | 5/89 [00:10<02:51,  2.04s/it][A
  7%|▋         | 6/89 [00:12<02:50,  2.05s/it][A
  8%|▊         | 7/89 [00:14<02:50,  2.08s/it][A
  9%|▉         | 8/89 [00:17<02:59,  2.22s/it][A
 10%|█         | 9/89 [00:19<03:00,  2.26s/it][A
 11%|█         | 10/89 [00:21<02:53,  2.19s/it][A
 12%|█▏        | 11/89 [00:24<03:01,  2.33s/it][A
 13%|█▎        | 12/89 [00:26<03:03,  2.38s/it][A
 15%|█▍        | 13/89 [00:28<02:54,  2.30s/it][A
 16%|█▌        | 14/89 [00:30<02:45,  2.21s/it][A
 17%|█▋        | 15/89 [00:33<02:49,  2.29s/it][A
 18%|█▊        | 16/89 [00:35<02:46,  2.28s/it][A

NOT MATCHED
ecpe-2d: emotion-cause pair extraction based on joint two-dimensional representation, interaction and prediction
emotion-cause pair extraction: a new task to emotion analysis in texts



 19%|█▉        | 17/89 [00:37<02:42,  2.26s/it][A
 20%|██        | 18/89 [00:39<02:39,  2.25s/it][A

NOT MATCHED
effective inter-clause modeling for end-to-end emotion-cause pair extraction
end-to-end emotion-cause pair extraction via learning to link



 21%|██▏       | 19/89 [00:41<02:28,  2.12s/it][A
 22%|██▏       | 20/89 [00:43<02:23,  2.08s/it][A
 24%|██▎       | 21/89 [00:45<02:19,  2.05s/it][A
 25%|██▍       | 22/89 [00:48<02:31,  2.27s/it][A
 26%|██▌       | 23/89 [00:50<02:23,  2.18s/it][A
 27%|██▋       | 24/89 [00:52<02:22,  2.19s/it][A
 28%|██▊       | 25/89 [00:54<02:22,  2.22s/it][A
 29%|██▉       | 26/89 [00:57<02:20,  2.23s/it][A
 30%|███       | 27/89 [00:59<02:22,  2.30s/it][A
 31%|███▏      | 28/89 [01:01<02:17,  2.25s/it][A
 33%|███▎      | 29/89 [01:04<02:19,  2.33s/it][A
 34%|███▎      | 30/89 [01:07<02:25,  2.47s/it][A
 35%|███▍      | 31/89 [01:08<02:12,  2.29s/it][A
 36%|███▌      | 32/89 [01:10<02:04,  2.18s/it][A
 37%|███▋      | 33/89 [01:13<02:03,  2.21s/it][A
 38%|███▊      | 34/89 [01:15<02:01,  2.21s/it][A
 39%|███▉      | 35/89 [01:18<02:11,  2.43s/it][A
 40%|████      | 36/89 [01:20<02:04,  2.35s/it][A
 42%|████▏     | 37/89 [01:22<01:55,  2.23s/it][A
 43%|████▎     | 38/89 [01:24<

NOT MATCHED
predicting the topical stance and political leaning of media using tweets
predicting the topical stance of media and popular twitter users



 57%|█████▋    | 51/89 [01:52<01:24,  2.21s/it][A
 58%|█████▊    | 52/89 [01:54<01:18,  2.13s/it][A
 60%|█████▉    | 53/89 [01:56<01:18,  2.17s/it][A
 61%|██████    | 54/89 [01:58<01:16,  2.17s/it][A
 62%|██████▏   | 55/89 [02:01<01:15,  2.21s/it][A
 63%|██████▎   | 56/89 [02:03<01:11,  2.17s/it][A
 64%|██████▍   | 57/89 [02:05<01:09,  2.16s/it][A
 65%|██████▌   | 58/89 [02:07<01:05,  2.11s/it][A
 66%|██████▋   | 59/89 [02:09<01:03,  2.11s/it][A
 67%|██████▋   | 60/89 [02:11<01:01,  2.12s/it][A
 69%|██████▊   | 61/89 [02:13<00:59,  2.11s/it][A
 70%|██████▉   | 62/89 [02:16<01:00,  2.22s/it][A
 71%|███████   | 63/89 [02:18<00:59,  2.30s/it][A
 72%|███████▏  | 64/89 [02:21<00:56,  2.26s/it][A
 73%|███████▎  | 65/89 [02:23<00:53,  2.22s/it][A
 74%|███████▍  | 66/89 [02:25<00:52,  2.30s/it][A
 75%|███████▌  | 67/89 [02:27<00:50,  2.30s/it][A
 76%|███████▋  | 68/89 [02:30<00:48,  2.29s/it][A
 78%|███████▊  | 69/89 [02:32<00:47,  2.35s/it][A
 79%|███████▊  | 70/89 [02:35<

NOT MATCHED
structural information preserving for graph-to-text generation
structural neural encoders for amr-to-text generation



 80%|███████▉  | 71/89 [02:37<00:41,  2.33s/it][A
 81%|████████  | 72/89 [02:39<00:39,  2.34s/it][A
 82%|████████▏ | 73/89 [02:42<00:38,  2.40s/it][A
 83%|████████▎ | 74/89 [02:44<00:34,  2.32s/it][A
 84%|████████▍ | 75/89 [02:46<00:30,  2.18s/it][A
 85%|████████▌ | 76/89 [02:48<00:28,  2.18s/it][A
 87%|████████▋ | 77/89 [02:50<00:25,  2.10s/it][A
 88%|████████▊ | 78/89 [02:52<00:23,  2.13s/it][A
 89%|████████▉ | 79/89 [02:54<00:21,  2.16s/it][A
 90%|████████▉ | 80/89 [02:57<00:19,  2.21s/it][A
 91%|█████████ | 81/89 [02:59<00:17,  2.16s/it][A
 92%|█████████▏| 82/89 [03:01<00:14,  2.10s/it][A
 93%|█████████▎| 83/89 [03:03<00:12,  2.15s/it][A
 94%|█████████▍| 84/89 [03:05<00:10,  2.15s/it][A
 96%|█████████▌| 85/89 [03:07<00:08,  2.11s/it][A
 97%|█████████▋| 86/89 [03:09<00:06,  2.10s/it][A
 98%|█████████▊| 87/89 [03:11<00:04,  2.08s/it][A
 99%|█████████▉| 88/89 [03:13<00:02,  2.08s/it][A
100%|██████████| 89/89 [03:16<00:00,  2.20s/it]

  0%|          | 0/84 [00:00<?, 

NOT MATCHED
improving image captioning with better use of caption
hidden state guidance: improving image captioning using an image conditioned autoencoder



 48%|████▊     | 40/84 [01:28<01:37,  2.21s/it][A

NOT MATCHED
improving multimodal named entity recognition via entity span detection with unified multimodal transformer
a multimodal deep learning approach for named entity recognition from social media



 49%|████▉     | 41/84 [01:30<01:37,  2.28s/it][A

NOT MATCHED
inset: sentence infilling with inter-sentential transformer
inset: sentence infilling with inter-sentential generative pre-training



 50%|█████     | 42/84 [01:33<01:37,  2.32s/it][A
 51%|█████     | 43/84 [01:35<01:33,  2.29s/it][A
 52%|█████▏    | 44/84 [01:37<01:32,  2.30s/it][A
 54%|█████▎    | 45/84 [01:39<01:27,  2.24s/it][A
 55%|█████▍    | 46/84 [01:42<01:23,  2.19s/it][A
 56%|█████▌    | 47/84 [01:44<01:23,  2.25s/it][A

NOT MATCHED
learning to ask more: semi-autoregressive sequential question generation under dual-graph interaction
semi-autoregressive neural machine translation



 57%|█████▋    | 48/84 [01:46<01:19,  2.22s/it][A
 58%|█████▊    | 49/84 [01:49<01:20,  2.30s/it][A
 60%|█████▉    | 50/84 [01:51<01:16,  2.24s/it][A
 61%|██████    | 51/84 [01:53<01:12,  2.18s/it][A
 62%|██████▏   | 52/84 [01:55<01:10,  2.22s/it][A
 63%|██████▎   | 53/84 [01:57<01:08,  2.21s/it][A
 64%|██████▍   | 54/84 [01:59<01:04,  2.14s/it][A
 65%|██████▌   | 55/84 [02:01<01:01,  2.12s/it][A
 67%|██████▋   | 56/84 [02:03<00:59,  2.14s/it][A
 68%|██████▊   | 57/84 [02:06<00:58,  2.15s/it][A
 69%|██████▉   | 58/84 [02:08<00:54,  2.10s/it][A

NOT MATCHED
premise selection in natural language mathematical texts
natural language premise selection: finding supporting statements for mathematical text



 70%|███████   | 59/84 [02:10<00:54,  2.16s/it][A
 71%|███████▏  | 60/84 [02:12<00:53,  2.24s/it][A

NOT MATCHED
reinceptione: relation-aware inception network with joint local-global structural information for knowledge graph embedding
relation-aware entity alignment for heterogeneous knowledge graphs



 73%|███████▎  | 61/84 [02:15<00:51,  2.26s/it][A
 74%|███████▍  | 62/84 [02:17<00:47,  2.18s/it][A
 75%|███████▌  | 63/84 [02:19<00:44,  2.13s/it][A
 76%|███████▌  | 64/84 [02:21<00:44,  2.20s/it][A
 77%|███████▋  | 65/84 [02:23<00:40,  2.13s/it][A
 79%|███████▊  | 66/84 [02:25<00:39,  2.20s/it][A
 80%|███████▉  | 67/84 [02:27<00:36,  2.12s/it][A
 81%|████████  | 68/84 [02:29<00:33,  2.12s/it][A
 82%|████████▏ | 69/84 [02:32<00:31,  2.13s/it][A
 83%|████████▎ | 70/84 [02:34<00:31,  2.26s/it][A
 85%|████████▍ | 71/84 [02:36<00:29,  2.27s/it][A
 86%|████████▌ | 72/84 [02:38<00:26,  2.21s/it][A
 87%|████████▋ | 73/84 [02:41<00:24,  2.20s/it][A
 88%|████████▊ | 74/84 [02:43<00:21,  2.18s/it][A
 89%|████████▉ | 75/84 [02:45<00:19,  2.17s/it][A
 90%|█████████ | 76/84 [02:48<00:18,  2.31s/it][A
 92%|█████████▏| 77/84 [02:50<00:15,  2.27s/it][A
 93%|█████████▎| 78/84 [02:52<00:13,  2.29s/it][A
 94%|█████████▍| 79/84 [02:54<00:11,  2.24s/it][A
 95%|█████████▌| 80/84 [02:56<

NOT MATCHED
camouflaged chinese spam content detection with semi-supervised generative active learning
detect camouflaged spam content via stoneskipping: graph and text joint embedding for chinese character variation representation



 22%|██▏       | 6/27 [00:13<00:48,  2.32s/it][A
 26%|██▌       | 7/27 [00:15<00:44,  2.21s/it][A
 30%|██▉       | 8/27 [00:17<00:41,  2.17s/it][A
 33%|███▎      | 9/27 [00:19<00:38,  2.12s/it][A
 37%|███▋      | 10/27 [00:21<00:34,  2.06s/it][A
 41%|████      | 11/27 [00:23<00:33,  2.11s/it][A
 44%|████▍     | 12/27 [00:27<00:39,  2.60s/it][A

NOT MATCHED
interpretable operational risk classification with semi-supervised variational autoencoder
disentangled variational auto-encoder for semi-supervised learning



 48%|████▊     | 13/27 [00:29<00:34,  2.45s/it][A
 52%|█████▏    | 14/27 [00:32<00:31,  2.43s/it][A
 56%|█████▌    | 15/27 [00:34<00:28,  2.35s/it][A

NOT MATCHED
learning low-resource end-to-end goal-oriented dialog for fast and reliable system deployment
learning end-to-end goal-oriented dialog



 59%|█████▉    | 16/27 [00:36<00:25,  2.34s/it][A
 63%|██████▎   | 17/27 [00:38<00:22,  2.22s/it][A
 67%|██████▋   | 18/27 [00:40<00:19,  2.12s/it][A
 70%|███████   | 19/27 [00:42<00:16,  2.12s/it][A
 74%|███████▍  | 20/27 [00:44<00:14,  2.07s/it][A
 78%|███████▊  | 21/27 [00:46<00:12,  2.09s/it][A
 81%|████████▏ | 22/27 [00:48<00:10,  2.00s/it][A
 85%|████████▌ | 23/27 [00:50<00:08,  2.06s/it][A
 89%|████████▉ | 24/27 [00:52<00:06,  2.00s/it][A
 93%|█████████▎| 25/27 [00:54<00:04,  2.04s/it][A
 96%|█████████▋| 26/27 [00:56<00:02,  2.12s/it][A
100%|██████████| 27/27 [00:59<00:00,  2.19s/it]

  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:36,  2.30s/it][A
 12%|█▏        | 2/17 [00:04<00:33,  2.24s/it][A
 18%|█▊        | 3/17 [00:06<00:30,  2.20s/it][A
 24%|██▎       | 4/17 [00:08<00:27,  2.15s/it][A
 29%|██▉       | 5/17 [00:10<00:26,  2.18s/it][A
 35%|███▌      | 6/17 [00:13<00:24,  2.21s/it][A
 41%|████      | 7/17 [00:15<00:22,  2.27s/it]

NOT MATCHED
video-grounded dialogues with pretrained generation language models
unified language model pre-training for natural language understanding and generation



 93%|█████████▎| 28/30 [01:00<00:04,  2.12s/it][A
 97%|█████████▋| 29/30 [01:02<00:02,  2.12s/it][A
100%|██████████| 30/30 [01:04<00:00,  2.15s/it]

  0%|          | 0/26 [00:00<?, ?it/s][A
  4%|▍         | 1/26 [00:02<01:04,  2.58s/it][A
  8%|▊         | 2/26 [00:04<00:58,  2.42s/it][A
 12%|█▏        | 3/26 [00:06<00:52,  2.28s/it][A
 15%|█▌        | 4/26 [00:08<00:47,  2.18s/it][A
 19%|█▉        | 5/26 [00:10<00:44,  2.14s/it][A
 23%|██▎       | 6/26 [00:12<00:41,  2.08s/it][A
 27%|██▋       | 7/26 [00:14<00:39,  2.10s/it][A
 31%|███       | 8/26 [00:16<00:37,  2.08s/it][A
 35%|███▍      | 9/26 [00:19<00:39,  2.31s/it][A
 38%|███▊      | 10/26 [00:21<00:36,  2.28s/it][A
 42%|████▏     | 11/26 [00:23<00:33,  2.21s/it][A
 46%|████▌     | 12/26 [00:26<00:32,  2.29s/it][A
 50%|█████     | 13/26 [00:28<00:28,  2.23s/it][A
 54%|█████▍    | 14/26 [00:30<00:27,  2.29s/it][A
 58%|█████▊    | 15/26 [00:33<00:25,  2.35s/it][A
 62%|██████▏   | 16/26 [00:35<00:23,  2.38s/it][A

NOT MATCHED
content word aware neural machine translation
selective attention for context-aware neural machine translation



 21%|██        | 9/43 [00:19<01:13,  2.16s/it][A
 23%|██▎       | 10/43 [00:21<01:12,  2.20s/it][A
 26%|██▌       | 11/43 [00:23<01:08,  2.14s/it][A
 28%|██▊       | 12/43 [00:26<01:08,  2.20s/it][A
 30%|███       | 13/43 [00:28<01:05,  2.17s/it][A
 33%|███▎      | 14/43 [00:29<01:00,  2.07s/it][A
 35%|███▍      | 15/43 [00:32<00:58,  2.10s/it][A
 37%|███▋      | 16/43 [00:34<00:55,  2.07s/it][A
 40%|███▉      | 17/43 [00:36<00:54,  2.10s/it][A

NOT MATCHED
language-aware interlingua for multilingual neural machine translation
a neural interlingua for multilingual machine translation



 42%|████▏     | 18/43 [00:38<00:53,  2.14s/it][A
 44%|████▍     | 19/43 [00:40<00:51,  2.15s/it][A
 47%|████▋     | 20/43 [00:42<00:48,  2.11s/it][A
 49%|████▉     | 21/43 [00:44<00:46,  2.09s/it][A
 51%|█████     | 22/43 [00:46<00:43,  2.06s/it][A
 53%|█████▎    | 23/43 [00:48<00:40,  2.01s/it][A
 56%|█████▌    | 24/43 [00:50<00:39,  2.07s/it][A

NOT MATCHED
neural graph matching networks for chinese short text matching
graph matching networks for learning the similarity of graph structured objects



 58%|█████▊    | 25/43 [00:53<00:38,  2.14s/it][A
 60%|██████    | 26/43 [00:55<00:36,  2.13s/it][A
 63%|██████▎   | 27/43 [00:57<00:33,  2.07s/it][A
 65%|██████▌   | 28/43 [00:59<00:31,  2.09s/it][A
 67%|██████▋   | 29/43 [01:01<00:31,  2.24s/it][A
 70%|██████▉   | 30/43 [01:04<00:28,  2.21s/it][A
 72%|███████▏  | 31/43 [01:06<00:27,  2.28s/it][A
 74%|███████▍  | 32/43 [01:08<00:25,  2.28s/it][A
 77%|███████▋  | 33/43 [01:10<00:22,  2.24s/it][A
 79%|███████▉  | 34/43 [01:13<00:20,  2.27s/it][A
 81%|████████▏ | 35/43 [01:15<00:17,  2.23s/it][A
 84%|████████▎ | 36/43 [01:18<00:16,  2.34s/it][A
 86%|████████▌ | 37/43 [01:20<00:13,  2.27s/it][A
 88%|████████▊ | 38/43 [01:22<00:11,  2.26s/it][A
 91%|█████████ | 39/43 [01:24<00:08,  2.16s/it][A
 93%|█████████▎| 40/43 [01:26<00:06,  2.12s/it][A
 95%|█████████▌| 41/43 [01:28<00:04,  2.15s/it][A
 98%|█████████▊| 42/43 [01:31<00:02,  2.28s/it][A

NOT MATCHED
``you sound just like your father’’ commercial machine translation systems include stylistic biases
reducing gender bias in neural machine translation as a domain adaptation problem



100%|██████████| 43/43 [01:33<00:00,  2.16s/it]

  0%|          | 0/21 [00:00<?, ?it/s][A
  5%|▍         | 1/21 [00:02<00:47,  2.37s/it][A
 10%|▉         | 2/21 [00:05<00:47,  2.50s/it][A
 14%|█▍        | 3/21 [00:08<00:46,  2.60s/it][A
 19%|█▉        | 4/21 [00:09<00:40,  2.39s/it][A
 24%|██▍       | 5/21 [00:11<00:36,  2.29s/it][A
 29%|██▊       | 6/21 [00:13<00:32,  2.18s/it][A
 33%|███▎      | 7/21 [00:16<00:31,  2.26s/it][A
 38%|███▊      | 8/21 [00:18<00:30,  2.35s/it][A
 43%|████▎     | 9/21 [00:21<00:27,  2.28s/it][A
 48%|████▊     | 10/21 [00:23<00:25,  2.36s/it][A
 52%|█████▏    | 11/21 [00:25<00:22,  2.30s/it][A
 57%|█████▋    | 12/21 [00:27<00:19,  2.18s/it][A
 62%|██████▏   | 13/21 [00:29<00:17,  2.19s/it][A
 67%|██████▋   | 14/21 [00:32<00:15,  2.20s/it][A
 71%|███████▏  | 15/21 [00:34<00:13,  2.22s/it][A
 76%|███████▌  | 16/21 [00:36<00:11,  2.27s/it][A
 81%|████████  | 17/21 [00:39<00:09,  2.32s/it][A
 86%|████████▌ | 18/21 [00:41<00:06,  2.27s/it][A

NOT MATCHED
tree-structured neural topic model
structured neural topic models for reviews



  5%|▌         | 1/19 [00:01<00:34,  1.89s/it][A
 11%|█         | 2/19 [00:04<00:33,  1.96s/it][A
 16%|█▌        | 3/19 [00:06<00:32,  2.06s/it][A
 21%|██        | 4/19 [00:08<00:31,  2.09s/it][A
 26%|██▋       | 5/19 [00:11<00:31,  2.25s/it][A
 32%|███▏      | 6/19 [00:13<00:28,  2.19s/it][A
 37%|███▋      | 7/19 [00:15<00:27,  2.31s/it][A
 42%|████▏     | 8/19 [00:17<00:24,  2.18s/it][A
 47%|████▋     | 9/19 [00:19<00:21,  2.11s/it][A
 53%|█████▎    | 10/19 [00:21<00:19,  2.15s/it][A

NOT MATCHED
multimodal and multiresolution speech recognition with transformers
multiresolution and multimodal speech recognition with transformers



 58%|█████▊    | 11/19 [00:24<00:18,  2.26s/it][A
 63%|██████▎   | 12/19 [00:26<00:15,  2.22s/it][A
 68%|██████▊   | 13/19 [00:28<00:12,  2.14s/it][A
 74%|███████▎  | 14/19 [00:30<00:10,  2.13s/it][A
 79%|███████▉  | 15/19 [00:33<00:09,  2.27s/it][A
 84%|████████▍ | 16/19 [00:35<00:06,  2.28s/it][A
 89%|████████▉ | 17/19 [00:37<00:04,  2.25s/it][A
 95%|█████████▍| 18/19 [00:39<00:02,  2.24s/it][A
100%|██████████| 19/19 [00:42<00:00,  2.21s/it]

  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.49s/it][A
 29%|██▊       | 2/7 [00:04<00:11,  2.37s/it][A
 43%|████▎     | 3/7 [00:06<00:09,  2.35s/it][A
 57%|█████▋    | 4/7 [00:08<00:06,  2.21s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.24s/it][A
 86%|████████▌ | 6/7 [00:13<00:02,  2.22s/it][A
100%|██████████| 7/7 [00:15<00:00,  2.20s/it]

  0%|          | 0/3 [00:00<?, ?it/s][A
 33%|███▎      | 1/3 [00:02<00:04,  2.06s/it][A
 67%|██████▋   | 2/3 [00:03<00:02,  2.02s/it][A
100%|██████████| 3/3 

NOT MATCHED
a geometry-inspired attack for generating natural language adversarial examples
a geometry-inspired decision-based attack



 38%|███▊      | 3/8 [00:06<00:10,  2.09s/it][A
 50%|█████     | 4/8 [00:08<00:08,  2.18s/it][A
 62%|██████▎   | 5/8 [00:11<00:06,  2.23s/it][A
 75%|███████▌  | 6/8 [00:13<00:04,  2.15s/it][A
 88%|████████▊ | 7/8 [00:15<00:02,  2.20s/it][A
100%|██████████| 8/8 [00:17<00:00,  2.20s/it]

  0%|          | 0/5 [00:00<?, ?it/s][A
 20%|██        | 1/5 [00:01<00:07,  1.94s/it][A
 40%|████      | 2/5 [00:04<00:06,  2.03s/it][A
 60%|██████    | 3/5 [00:06<00:04,  2.08s/it][A
 80%|████████  | 4/5 [00:08<00:02,  2.20s/it][A
100%|██████████| 5/5 [00:10<00:00,  2.16s/it]

  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:10,  2.16s/it][A
 33%|███▎      | 2/6 [00:04<00:08,  2.12s/it][A
 50%|█████     | 3/6 [00:06<00:06,  2.16s/it][A
 67%|██████▋   | 4/6 [00:08<00:04,  2.21s/it][A
 83%|████████▎ | 5/6 [00:10<00:02,  2.12s/it][A
100%|██████████| 6/6 [00:12<00:00,  2.15s/it]

  0%|          | 0/5 [00:00<?, ?it/s][A

NOT MATCHED
unsupervised multilingual sentence embeddings for parallel corpus mining
margin-based parallel corpus mining with multilingual sentence embeddings



 20%|██        | 1/5 [00:02<00:08,  2.06s/it][A
 40%|████      | 2/5 [00:04<00:06,  2.12s/it][A
 60%|██████    | 3/5 [00:07<00:04,  2.29s/it][A
 80%|████████  | 4/5 [00:09<00:02,  2.32s/it][A
100%|██████████| 5/5 [00:11<00:00,  2.29s/it]

  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.09s/it][A
 25%|██▌       | 2/8 [00:04<00:13,  2.18s/it][A
 38%|███▊      | 3/8 [00:06<00:10,  2.18s/it][A
 50%|█████     | 4/8 [00:09<00:09,  2.27s/it][A
 62%|██████▎   | 5/8 [00:11<00:06,  2.23s/it][A
 75%|███████▌  | 6/8 [00:14<00:05,  2.65s/it][A

NOT MATCHED
υbleu: uncertainty-aware automatic evaluation method for open-domain dialogue systems
better automatic evaluation of open-domain dialogue systems with contextualized embeddings



 88%|████████▊ | 7/8 [00:17<00:02,  2.51s/it][A
100%|██████████| 8/8 [00:19<00:00,  2.41s/it]

  0%|          | 0/3 [00:00<?, ?it/s][A
 33%|███▎      | 1/3 [00:02<00:04,  2.21s/it][A
 67%|██████▋   | 2/3 [00:04<00:02,  2.12s/it][A
100%|██████████| 3/3 [00:06<00:00,  2.11s/it]

  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.53s/it][A
 29%|██▊       | 2/7 [00:04<00:11,  2.37s/it][A
 43%|████▎     | 3/7 [00:06<00:09,  2.29s/it][A
 57%|█████▋    | 4/7 [00:08<00:06,  2.27s/it][A
 71%|███████▏  | 5/7 [00:10<00:04,  2.20s/it][A
 86%|████████▌ | 6/7 [00:13<00:02,  2.30s/it][A
100%|██████████| 7/7 [00:15<00:00,  2.23s/it]

  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.24s/it][A
 29%|██▊       | 2/7 [00:04<00:11,  2.29s/it][A
 43%|████▎     | 3/7 [00:06<00:08,  2.23s/it][A
 57%|█████▋    | 4/7 [00:09<00:07,  2.36s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.38s/it][A
 86%|████████▌ | 6/7 [00:14<00:02,  2.40s/it][A


In [0]:
# Write the final Markdown listing: one "## <section>" heading per paper
# category, each followed by whatever generate_paper_list_with_arxiv_link
# emits for that category's paper list.
#
# Sections are written in this fixed order; each entry pairs the exact heading
# text with the paper list loaded earlier in the notebook.
_output_sections = [
    ("## Long Papers\n\n", longp),
    ("## Short Papers\n\n", short),
    ("## System Demonstrations\n\n", demop),
    ("## Student Research Workshop\n\n", student),
]

# encoding="utf-8" is explicit: the paper data contains non-ASCII characters
# (e.g. "Väth" in the demo author list), and without it open() falls back to
# the platform's locale encoding, which may fail to encode them or produce a
# non-UTF-8 file. This also matches how read_papers opens its input files.
# NOTE(review): assumes generate_paper_list_with_arxiv_link writes titles /
# authors to the handle it is given -- confirm against its definition.
with open("papers_with_arxiv_link.md", "w", encoding="utf-8") as f:
    for _section_heading, _section_papers in _output_sections:
        f.write(_section_heading)
        generate_paper_list_with_arxiv_link(f, _section_papers)