bibtex.bib

@inproceedings{DBLP:conf:acl:ChenZZK022,
  author     = {Yanda Chen and Ruiqi Zhong and Sheng Zha and George Karypis and
                He He},
  editor     = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio},
  title      = {Meta-learning via Language Model In-context Tuning},
  booktitle  = {ACL},
  pages      = {719--730},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.acl-long.53},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.53},
  timestamp  = {Mon, 01 Aug 2022 16:27:45 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChenZZK022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning, Meta Learning},
  plm        = {BERT, DeBERTa, GPT-2},
}
@string{DBLP:conf:acl:ChenZZK022 = "This paper proposes in-context tuning, which recasts task adaptation and prediction as a simple sequence prediction problem: to form the input sequence,  concatenate the task instruction, labeled in-context examples, and the target input to predict; to meta train the model to learn from in-context examples, finetune a PLM to predict the target label given the input sequence on a collection of tasks (very similar to MetaICL). On LAMA and BinaryClfs, the proposed method outperforms MAML."}

@article{DBLP:journals/corr/abs-2210-12810,
  author     = {Xingyao Wang and Sha Li and Heng Ji},
  title      = {{Code4Struct}: Code Generation for Few-Shot Structured Prediction
                from Natural Language},
  journal    = {CoRR},
  volume     = {abs/2210.12810},
  year       = {2022},
  doi        = {10.48550/arXiv.2210.12810},
  url        = {https://doi.org/10.48550/arXiv.2210.12810},
  eprinttype = {arXiv},
  eprint     = {2210.12810},
  timestamp  = {Fri, 28 Oct 2022 14:21:57 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-12810.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation},
}

@inproceedings{DBLP:conf/cvpr/0002ZL0SRSPDP22,
  author     = {Zifeng Wang and Zizhao Zhang and Chen{-}Yu Lee and Han Zhang and
                Ruoxi Sun and Xiaoqi Ren and Guolong Su and Vincent Perot and
                Jennifer G. Dy and Tomas Pfister},
  title      = {Learning to Prompt for Continual Learning},
  booktitle  = {CVPR},
  pages      = {139--149},
  publisher  = {{IEEE}},
  year       = {2022},
  doi        = {10.1109/CVPR52688.2022.00024},
  url        = {https://doi.org/10.1109/CVPR52688.2022.00024},
  timestamp  = {Tue, 04 Oct 2022 17:56:08 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/0002ZL0SRSPDP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Continual Learning, Prompt Engineering},
}

@inproceedings{DBLP:conf/emnlp/Hu0X0SO22,
  author     = {Yushi Hu and Chia{-}Hsuan Lee and Tianbao Xie and Tao Yu and
                Noah A. Smith and Mari Ostendorf},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {In-Context Learning for Few-Shot Dialogue State Tracking},
  booktitle  = {Findings of the Association for Computational Linguistics:
                {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                December 7-11, 2022},
  pages      = {2627--2643},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.193},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/Hu0X0SO22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/GuptaJYMEB22,
  author     = {Prakhar Gupta and Cathy Jiao and Yi{-}Ting Yeh and
                Shikib Mehri and Maxine Esk{\'{e}}nazi and Jeffrey P. Bigham},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {{InstructDial}: Improving Zero and Few-shot Generalization in
                Dialogue through Instruction Tuning},
  booktitle  = {Proceedings of the 2022 Conference on Empirical Methods in
                Natural Language Processing, {EMNLP} 2022, Abu Dhabi,
                United Arab Emirates, December 7-11, 2022},
  pages      = {505--525},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.33},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/GuptaJYMEB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2210-07128,
  author     = {Aman Madaan and Shuyan Zhou and Uri Alon and Yiming Yang and
                Graham Neubig},
  title      = {Language Models of Code are Few-Shot Commonsense Learners},
  journal    = {CoRR},
  volume     = {abs/2210.07128},
  year       = {2022},
  doi        = {10.48550/arXiv.2210.07128},
  url        = {https://doi.org/10.48550/arXiv.2210.07128},
  eprinttype = {arXiv},
  eprint     = {2210.07128},
  timestamp  = {Tue, 18 Oct 2022 15:06:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-07128.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation},
}

@inproceedings{DBLP:conf/naacl/WebsonP22,
  author     = {Albert Webson and Ellie Pavlick},
  editor     = {Marine Carpuat and Marie{-}Catherine de Marneffe and
                Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title      = {Do Prompt-Based Models Really Understand the Meaning of Their Prompts?},
  booktitle  = {NAACL},
  pages      = {2300--2344},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.naacl-main.167},
  url        = {https://doi.org/10.18653/v1/2022.naacl-main.167},
  timestamp  = {Mon, 01 Aug 2022 16:28:03 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/WebsonP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering},
}

@inproceedings{DBLP:conf:naacl:MinLZH22,
  author     = {Sewon Min and Mike Lewis and Luke Zettlemoyer and
                Hannaneh Hajishirzi},
  editor     = {Marine Carpuat and Marie{-}Catherine de Marneffe and
                Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title      = {{MetaICL}: Learning to Learn In Context},
  booktitle  = {NAACL},
  pages      = {2791--2809},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.naacl-main.201},
  url        = {https://doi.org/10.18653/v1/2022.naacl-main.201},
  timestamp  = {Mon, 01 Aug 2022 16:28:01 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/MinLZH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning, Meta Learning},
  code       = {https://github.com/facebookresearch/MetaICL},
  plm        = {GPT-2},
}
@string{DBLP:conf:naacl:MinLZH22 = "MetaICL proposes a supervised meta-training framework to enable LMs to more effectively learn a new task in context. In MetaICL, each meta-training example includes several training examples from one task that will be presented together as a single sequence to the LM, and the prediction of the final example is used to calculate the loss."}

@article{DBLP:journals/corr/abs-2209-12356,
  author     = {Tanya Goyal and Junyi Jessy Li and Greg Durrett},
  title      = {News Summarization and Evaluation in the Era of {GPT-3}},
  journal    = {NeurIPS},
  year       = {2022},
  doi        = {10.48550/arXiv.2209.12356},
  url        = {https://doi.org/10.48550/arXiv.2209.12356},
  eprinttype = {arXiv},
  eprint     = {2209.12356},
  timestamp  = {Thu, 06 Oct 2022 14:41:30 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-12356.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {AIGC},
}

@article{DBLP:journals:corr:abs-2210-09338,
  author     = {Michihiro Yasunaga and Antoine Bosselut and Hongyu Ren and
                Xikun Zhang and Christopher D. Manning and Percy Liang and
                Jure Leskovec},
  title      = {Deep Bidirectional Language-Knowledge Graph Pretraining},
  journal    = {NeurIPS},
  year       = {2022},
  doi        = {10.48550/arXiv.2210.09338},
  url        = {https://doi.org/10.48550/arXiv.2210.09338},
  eprinttype = {arXiv},
  eprint     = {2210.09338},
  timestamp  = {Mon, 24 Oct 2022 18:10:06 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-09338.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced,Knowledge Graph Embedding},
}

@article{DBLP:journals:corr:abs-2209-01975,
  author     = {Hongjin Su and Jungo Kasai and Chen Henry Wu and Weijia Shi and
                Tianlu Wang and Jiayi Xin and Rui Zhang and Mari Ostendorf and
                Luke Zettlemoyer and Noah A. Smith and Tao Yu},
  title      = {Selective Annotation Makes Language Models Better Few-Shot Learners},
  journal    = {CoRR},
  volume     = {abs/2209.01975},
  year       = {2022},
  doi        = {10.48550/arXiv.2209.01975},
  url        = {https://doi.org/10.48550/arXiv.2209.01975},
  eprinttype = {arXiv},
  eprint     = {2209.01975},
  timestamp  = {Tue, 27 Sep 2022 08:13:21 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-01975.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Selective Annotation, In-Context Learning},
  code       = {https://github.com/HKUNLP/icl-selective-annotation},
  plm        = {SBERT, GPT-J, GPT-Neo, GPT-3, Codex, OPT},
}
@string{DBLP:journals:corr:abs-2209-01975 = "This paper proposes a graph-based selective annotation method named vote-k to
(1) select a pool of examples to annotate from unlabeled data,
(2) retrieve prompts (contexts) from the annotated data pool for in-context learning.
Specifically, the selection method first selects a small set of unlabeled examples iteratively and then labels them to serve as contexts for LLMs to predict the labels of the rest unlabeled data. The method selects the predictions with highest confidence (log probability of generation output) to fill up the selective annotation pool."}

@article{DBLP:journals/pvldb/ChaiLTLL22,
  author     = {Chengliang Chai and Jiabin Liu and Nan Tang and Guoliang Li and
                Yuyu Luo},
  title      = {Selective Data Acquisition in the Wild for Model Charging},
  journal    = {VLDB},
  volume     = {15},
  number     = {7},
  pages      = {1466--1478},
  year       = {2022},
  url        = {https://www.vldb.org/pvldb/vol15/p1466-li.pdf},
  timestamp  = {Wed, 29 Jun 2022 11:10:54 +0200},
  biburl     = {https://dblp.org/rec/journals/pvldb/ChaiLTLL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Selective Annotation},
}

@article{DBLP:journals/corr/abs-2212-09420,
  author     = {Daoguang Zan and Bei Chen and Fengji Zhang and Dianjie Lu and
                Bingchao Wu and Bei Guan and Yongji Wang and Jian{-}Guang Lou},
  title      = {When Neural Model Meets {NL2Code}: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2212.09420},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.09420},
  url        = {https://doi.org/10.48550/arXiv.2212.09420},
  eprinttype = {arXiv},
  eprint     = {2212.09420},
  timestamp  = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-09420.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation, Survey},
}

@article{DBLP:journals:corr:abs-2212-13428,
  author     = {Chaoqi Zhen and Yanlei Shang and Xiangyu Liu and Yifei Li and
                Yong Chen and Dell Zhang},
  title      = {A Survey on Knowledge-Enhanced Pre-trained Language Models},
  journal    = {TKDE},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.13428},
  url        = {https://doi.org/10.48550/arXiv.2212.13428},
  eprinttype = {arXiv},
  eprint     = {2212.13428},
  timestamp  = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-13428.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced, Survey},
}

@article{yi2022review,
  author     = {Han, Yi and Qiao, Linbo and Li, Dongsheng and Liao, Xiangke},
  title      = {Review of Knowledge-Enhanced Pre-trained Language Models},
  journal    = {FCST},
  volume     = {16},
  number     = {7},
  pages      = {1439},
  year       = {2022},
  doi        = {10.3778/j.issn.1673-9418.2108105},
  url        = {https://doi.org/10.3778/j.issn.1673-9418.2108105},
  keywords   = {Knowledge Enhanced},
}

@article{DBLP:journals:corr:abs-2302-04023,
  author     = {Yejin Bang and Samuel Cahyawijaya and Nayeon Lee and
                Wenliang Dai and Dan Su and Bryan Wilie and Holy Lovenia and
                Ziwei Ji and Tiezheng Yu and Willy Chung and Quyet V. Do and
                Yan Xu and Pascale Fung},
  title      = {A Multitask, Multilingual, Multimodal Evaluation of {ChatGPT} on
                Reasoning, Hallucination, and Interactivity},
  journal    = {CoRR},
  volume     = {abs/2302.04023},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.04023},
  url        = {https://doi.org/10.48550/arXiv.2302.04023},
  eprinttype = {arXiv},
  eprint     = {2302.04023},
  timestamp  = {Fri, 10 Feb 2023 12:26:38 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-04023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation},
}
@string{DBLP:journals:corr:abs-2302-04023 = "本文提出了一个使用公开数据集定量评估交互式LLM（如ChatGPT）的框架。我们使用涵盖8个不同的常见NLP应用任务的21个数据集对ChatGPT进行了广泛的技术评估。我们基于这些数据集和一个新设计的多模态数据集评估了ChatGPT的多任务、多语言和多模态方面。"}

@article{DBLP:journals:corr:abs-2301-12810,
  author     = {Roi Cohen and Mor Geva and Jonathan Berant and Amir Globerson},
  title      = {Crawling the Internal Knowledge-Base of Language Models},
  journal    = {EACL},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.12810},
  url        = {https://doi.org/10.48550/arXiv.2301.12810},
  eprinttype = {arXiv},
  eprint     = {2301.12810},
  timestamp  = {Wed, 01 Feb 2023 14:38:31 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-12810.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation},
}
@string{DBLP:journals:corr:abs-2301-12810 = "本文提出一种从语言模型中提取结构化知识图谱的方法；使用专门设计的提示来控制提取过程中的精度和召回率；在GPT-3上进行了评估，显示了高精确度的结果。"}

@article{DBLP:journals/corr/abs-2211-09110,
  author     = {Percy Liang and Rishi Bommasani and Tony Lee and
                Dimitris Tsipras and Dilara Soylu and Michihiro Yasunaga and
                Yian Zhang and Deepak Narayanan and Yuhuai Wu and
                Ananya Kumar and Benjamin Newman and Binhang Yuan and
                Bobby Yan and Ce Zhang and Christian Cosgrove and
                Christopher D. Manning and Christopher R{\'{e}} and
                Diana Acosta{-}Navas and Drew A. Hudson and Eric Zelikman and
                Esin Durmus and Faisal Ladhak and Frieda Rong and
                Hongyu Ren and Huaxiu Yao and Jue Wang and
                Keshav Santhanam and Laurel J. Orr and Lucia Zheng and
                Mert Y{\"{u}}ksekg{\"{o}}n{\"{u}}l and Mirac Suzgun and
                Nathan Kim and Neel Guha and Niladri S. Chatterji and
                Omar Khattab and Peter Henderson and Qian Huang and
                Ryan Chi and Sang Michael Xie and Shibani Santurkar and
                Surya Ganguli and Tatsunori Hashimoto and Thomas Icard and
                Tianyi Zhang and Vishrav Chaudhary and William Wang and
                Xuechen Li and Yifan Mai and Yuhui Zhang and Yuta Koreeda},
  title      = {Holistic Evaluation of Language Models},
  journal    = {CoRR},
  volume     = {abs/2211.09110},
  year       = {2022},
  doi        = {10.48550/arXiv.2211.09110},
  url        = {https://doi.org/10.48550/arXiv.2211.09110},
  eprinttype = {arXiv},
  eprint     = {2211.09110},
  timestamp  = {Wed, 23 Nov 2022 18:03:56 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-09110.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation},
}

@article{DBLP:journals/corr/abs-2302-00923,
  author     = {Zhuosheng Zhang and Aston Zhang and Mu Li and Hai Zhao and
                George Karypis and Alex Smola},
  title      = {Multimodal Chain-of-Thought Reasoning in Language Models},
  journal    = {CoRR},
  volume     = {abs/2302.00923},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.00923},
  url        = {https://doi.org/10.48550/arXiv.2302.00923},
  eprinttype = {arXiv},
  eprint     = {2302.00923},
  timestamp  = {Thu, 09 Feb 2023 16:11:17 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-00923.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought},
}


@article{DBLP:journals:corr:abs-2301-00303,
  author     = {Hangfeng He and Hongming Zhang and Dan Roth},
  title      = {Rethinking with Retrieval: Faithful Large Language Model Inference},
  journal    = {CoRR},
  volume     = {abs/2301.00303},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.00303},
  url        = {https://doi.org/10.48550/arXiv.2301.00303},
  eprinttype = {arXiv},
  eprint     = {2301.00303},
  timestamp  = {Tue, 10 Jan 2023 15:10:12 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-00303.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought},
}
@string{DBLP:journals:corr:abs-2301-00303 = "本文通过用GPT-3在三个复杂的推理任务：常识推理，时间推理和表格推理上进行大量实验来评估RR的有效性。结果表明，RR可以产生更忠实的解释，并提高LLM的性能。"}

@inproceedings{DBLP:conf/aaai/VilaresSSG20,
  author     = {David Vilares and Michalina Strzyz and Anders S{\o}gaard and
                Carlos G{\'{o}}mez{-}Rodr{\'{\i}}guez},
  title      = {Parsing as Pretraining},
  booktitle  = {AAAI},
  pages      = {9114--9121},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/6446},
  timestamp  = {Mon, 07 Mar 2022 16:57:52 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/VilaresSSG20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Others},
}


// from Chen Yongrui

@article{DBLP:journals/corr/abs-2107-03374,
  author     = {Mark Chen and Jerry Tworek and Heewoo Jun and Qiming Yuan and
                Henrique Pond{\'{e}} de Oliveira Pinto and Jared Kaplan and
                Harrison Edwards and Yuri Burda and Nicholas Joseph and
                Greg Brockman and Alex Ray and Raul Puri and
                Gretchen Krueger and Michael Petrov and Heidy Khlaaf and
                Girish Sastry and Pamela Mishkin and Brooke Chan and
                Scott Gray and Nick Ryder and Mikhail Pavlov and
                Alethea Power and Lukasz Kaiser and Mohammad Bavarian and
                Clemens Winter and Philippe Tillet and
                Felipe Petroski Such and Dave Cummings and
                Matthias Plappert and Fotios Chantzis and
                Elizabeth Barnes and Ariel Herbert{-}Voss and
                William Hebgen Guss and Alex Nichol and Alex Paino and
                Nikolas Tezak and Jie Tang and Igor Babuschkin and
                Suchir Balaji and Shantanu Jain and William Saunders and
                Christopher Hesse and Andrew N. Carr and Jan Leike and
                Joshua Achiam and Vedant Misra and Evan Morikawa and
                Alec Radford and Matthew Knight and Miles Brundage and
                Mira Murati and Katie Mayer and Peter Welinder and
                Bob McGrew and Dario Amodei and Sam McCandlish and
                Ilya Sutskever and Wojciech Zaremba},
  title      = {Evaluating Large Language Models Trained on Code},
  journal    = {CoRR},
  volume     = {abs/2107.03374},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.03374},
  eprinttype = {arXiv},
  eprint     = {2107.03374},
  timestamp  = {Thu, 09 Feb 2023 14:04:35 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-03374.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation, Program and Code Generation},
}

@article{DBLP:journals/corr/abs-2301-12868,
  author     = {Terry Yue Zhuo and Zhuang Li and Yujin Huang and
                Yuan{-}Fang Li and Weiqing Wang and Gholamreza Haffari and
                Fatemeh Shiri},
  title      = {On Robustness of Prompt-based Semantic Parsing with Large
                Pre-trained Language Model: An Empirical Study on {Codex}},
  journal    = {CoRR},
  volume     = {abs/2301.12868},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.12868},
  url        = {https://doi.org/10.48550/arXiv.2301.12868},
  eprinttype = {arXiv},
  eprint     = {2301.12868},
  timestamp  = {Fri, 03 Feb 2023 10:27:08 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-12868.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering, Program and Code Generation},
}

@inproceedings{DBLP:conf/iclr/LiuSPGSKS18,
  author     = {Peter J. Liu and Mohammad Saleh and Etienne Pot and
                Ben Goodrich and Ryan Sepassi and Lukasz Kaiser and
                Noam Shazeer},
  title      = {Generating {Wikipedia} by Summarizing Long Sequences},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Hyg0vbWC-},
  timestamp  = {Thu, 25 Jul 2019 14:25:42 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LiuSPGSKS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {AIGC},
}

@techreport{radford2018improving,
  author      = {Radford, Alec and Narasimhan, Karthik and Salimans, Tim and
                 Sutskever, Ilya},
  title       = {Improving language understanding by generative pre-training},
  institution = {OpenAI},
  year        = {2018},
  url         = {https://cdn.openai.com/research-covers/language-unsupervised/language_understanding_paper.pdf},
  keywords    = {AIGC, Natural Language Understanding, Pre-Training Techniques},
  plm         = {GPT-1},
}

@techreport{radfordlanguage,
  author      = {Radford, Alec and Wu, Jeffrey and Child, Rewon and
                 Luan, David and Amodei, Dario and Sutskever, Ilya},
  title       = {Language Models are Unsupervised Multitask Learners},
  institution = {OpenAI},
  year        = {2019},
  url         = {https://cdn.openai.com/better-language-models/language_models_are_unsupervised_multitask_learners.pdf},
  keywords    = {AIGC, Pre-Training Techniques},
  plm         = {GPT-2},
}

@inproceedings{DBLP:conf/nips/BrownMRSKDNSSAA20,
  author     = {Tom B. Brown and Benjamin Mann and Nick Ryder and
                Melanie Subbiah and Jared Kaplan and Prafulla Dhariwal and
                Arvind Neelakantan and Pranav Shyam and Girish Sastry and
                Amanda Askell and Sandhini Agarwal and
                Ariel Herbert{-}Voss and Gretchen Krueger and Tom Henighan and
                Rewon Child and Aditya Ramesh and Daniel M. Ziegler and
                Jeffrey Wu and Clemens Winter and Christopher Hesse and
                Mark Chen and Eric Sigler and Mateusz Litwin and Scott Gray and
                Benjamin Chess and Jack Clark and Christopher Berner and
                Sam McCandlish and Alec Radford and Ilya Sutskever and
                Dario Amodei},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and
                Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Language Models are Few-Shot Learners},
  booktitle  = {NeurIPS},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/1457c0d6bfcb4967418bfb8ac142f64a-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 15:56:50 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/BrownMRSKDNSSAA20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Pre-Training Techniques, AIGC},
  plm        = {GPT-3},
}

@article{DBLP:journals:corr:abs-2301-00234,
  author     = {Qingxiu Dong and Lei Li and Damai Dai and Ce Zheng and
                Zhiyong Wu and Baobao Chang and Xu Sun and Jingjing Xu and
                Lei Li and Zhifang Sui},
  title      = {A Survey for In-context Learning},
  journal    = {CoRR},
  volume     = {abs/2301.00234},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.00234},
  url        = {https://doi.org/10.48550/arXiv.2301.00234},
  eprinttype = {arXiv},
  eprint     = {2301.00234},
  timestamp  = {Tue, 10 Jan 2023 15:10:12 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-00234.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning, Survey},
}
@string{DBLP:journals:corr:abs-2301-00234 = "This paper surveys and summarizes the progress and challenges of ICL, including ICL's formal definition, correlation to related studies, advanced techniques (training strategies, related analysis) and potential directions."}

@inproceedings{DBLP:conf:naacl:ChenDPMISK22,
  author     = {Mingda Chen and Jingfei Du and Ramakanth Pasunuru and
                Todor Mihaylov and Srini Iyer and Veselin Stoyanov and
                Zornitsa Kozareva},
  editor     = {Marine Carpuat and Marie{-}Catherine de Marneffe and
                Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title      = {Improving In-Context Few-Shot Learning via Self-Supervised Training},
  booktitle  = {NAACL},
  pages      = {3558--3573},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.naacl-main.260},
  url        = {https://doi.org/10.18653/v1/2022.naacl-main.260},
  timestamp  = {Mon, 01 Aug 2022 16:27:58 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/ChenDPMISK22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
  plm        = {MoE},
}
@string{DBLP:conf:naacl:ChenDPMISK22 = "This paper proposes to use self-supervision (MLM, NSP, CL, etc.) between pre-training and downstream usage to teach the LM to perform in-context learning. Analysis reveals that:
(1) benefits of self-supervised depends on the amount of training data,
(2) semantic similarity between training and evaluation tasks matters,
(3) adding training objectives without diversity does not help,
(4) model performance improves when choosing similar templates for both self-supervised and downstream tasks,
(5) self-supervised  tasks and human-annotated datasets are complementary,
(6) self-supervised-trained models are better at following task instructions."}

@inproceedings{DBLP:conf/iclr/WeiBZGYLDDL22,
  author     = {Jason Wei and Maarten Bosma and Vincent Y. Zhao and
                Kelvin Guu and Adams Wei Yu and Brian Lester and Nan Du and
                Andrew M. Dai and Quoc V. Le},
  title      = {Finetuned Language Models are Zero-Shot Learners},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=gEZrGCozdqR},
  timestamp  = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WeiBZGYLDDL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning},
}

@article{DBLP:journals/corr/abs-2201-08239,
  author     = {Romal Thoppilan and Daniel De Freitas and Jamie Hall and
                Noam Shazeer and Apoorv Kulshreshtha and
                Heng{-}Tze Cheng and Alicia Jin and Taylor Bos and
                Leslie Baker and Yu Du and YaGuang Li and Hongrae Lee and
                Huaixiu Steven Zheng and Amin Ghafouri and
                Marcelo Menegali and Yanping Huang and Maxim Krikun and
                Dmitry Lepikhin and James Qin and Dehao Chen and
                Yuanzhong Xu and Zhifeng Chen and Adam Roberts and
                Maarten Bosma and Yanqi Zhou and Chung{-}Ching Chang and
                Igor Krivokon and Will Rusch and Marc Pickett and
                Kathleen S. Meier{-}Hellstern and Meredith Ringel Morris and
                Tulsee Doshi and Renelito Delos Santos and Toju Duke and
                Johnny Soraker and Ben Zevenbergen and
                Vinodkumar Prabhakaran and Mark Diaz and Ben Hutchinson and
                Kristen Olson and Alejandra Molina and
                Erin Hoffman{-}John and Josh Lee and Lora Aroyo and
                Ravi Rajakumar and Alena Butryna and Matthew Lamm and
                Viktoriya Kuzmina and Joe Fenton and Aaron Cohen and
                Rachel Bernstein and Ray Kurzweil and
                Blaise Aguera{-}Arcas and Claire Cui and Marian Croak and
                Ed H. Chi and Quoc Le},
  title      = {{LaMDA}: Language Models for Dialog Applications},
  journal    = {CoRR},
  volume     = {abs/2201.08239},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.08239},
  eprinttype = {arXiv},
  eprint     = {2201.08239},
  timestamp  = {Fri, 22 Apr 2022 16:06:31 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-08239.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning},
}

@article{DBLP:journals/corr/abs-2210-11416,
  author    = {Hyung Won Chung and
               Le Hou and
               Shayne Longpre and
               Barret Zoph and
               Yi Tay and
               William Fedus and
               Eric Li and
               Xuezhi Wang and
               Mostafa Dehghani and
               Siddhartha Brahma and
               Albert Webson and
               Shixiang Shane Gu and
               Zhuyun Dai and
               Mirac Suzgun and
               Xinyun Chen and
               Aakanksha Chowdhery and
               Sharan Narang and
               Gaurav Mishra and
               Adams Yu and
               Vincent Y. Zhao and
               Yanping Huang and
               Andrew M. Dai and
               Hongkun Yu and
               Slav Petrov and
               Ed H. Chi and
               Jeff Dean and
               Jacob Devlin and
               Adam Roberts and
               Denny Zhou and
               Quoc V. Le and
               Jason Wei},
  title     = {Scaling Instruction-Finetuned Language Models},
  journal   = {CoRR},
  volume    = {abs/2210.11416},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.11416},
  doi       = {10.48550/arXiv.2210.11416},
  eprinttype = {arXiv},
  eprint    = {2210.11416},
  timestamp = {Wed, 26 Oct 2022 08:16:51 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-11416.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Instruction Tuning},
}

@inproceedings{DBLP:conf/emnlp/WangMAKMNADASPK22,
  author    = {Yizhong Wang and
               Swaroop Mishra and
               Pegah Alipoormolabashi and
               Yeganeh Kordi and
               Amirreza Mirzaei and
               Atharva Naik and
               Arjun Ashok and
               Arut Selvan Dhanasekaran and
               Anjana Arunkumar and
               David Stap and
               Eshaan Pathak and
               Giannis Karamanolakis and
               Haizhi Gary Lai and
               Ishan Purohit and
               Ishani Mondal and
               Jacob Anderson and
               Kirby Kuznia and
               Krima Doshi and
               Kuntal Kumar Pal and
               Maitreya Patel and
               Mehrad Moradshahi and
               Mihir Parmar and
               Mirali Purohit and
               Neeraj Varshney and
               Phani Rohitha Kaza and
               Pulkit Verma and
               Ravsehaj Singh Puri and
               Rushang Karia and
               Savan Doshi and
               Shailaja Keyur Sampat and
               Siddhartha Mishra and
               Sujan Reddy A and
               Sumanta Patro and
               Tanay Dixit and
               Xudong Shen},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {{Super-NaturalInstructions}: Generalization via Declarative Instructions
               on 1600+ {NLP} Tasks},
  booktitle = {EMNLP},
  pages     = {5085--5109},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.340},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/WangMAKMNADASPK22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Instruction Tuning},
}

@article{DBLP:journals:corr:abs-2205-10782,
  author    = {Or Honovich and
               Uri Shaham and
               Samuel R. Bowman and
               Omer Levy},
  title     = {Instruction Induction: From Few Examples to Natural Language Task
               Descriptions},
  journal   = {CoRR},
  volume    = {abs/2205.10782},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2205.10782},
  doi       = {10.48550/arXiv.2205.10782},
  eprinttype = {arXiv},
  eprint    = {2205.10782},
  timestamp = {Mon, 09 Jan 2023 08:11:56 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2205-10782.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning, Chain of Thought},
}
@String(DBLP:journals:corr:abs-2205-10782="(1) 探索了利用LLM在几个样本的情况下归纳出任务指令的能力；
(2) 测量两个指标：1. 模型归纳指令与人类归纳的指令对比，2. 利用模型归纳的指令作为prompt进行预测的执行准确率；
(3) 相比于GPT-3，InstructGPT效果更好，理所当然。")

@article{DBLP:journals/corr/abs-2211-01910,
  author    = {Yongchao Zhou and
               Andrei Ioan Muresanu and
               Ziwen Han and
               Keiran Paster and
               Silviu Pitis and
               Harris Chan and
               Jimmy Ba},
  title     = {Large Language Models Are Human-Level Prompt Engineers},
  journal   = {CoRR},
  volume    = {abs/2211.01910},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2211.01910},
  doi       = {10.48550/arXiv.2211.01910},
  eprinttype = {arXiv},
  eprint    = {2211.01910},
  timestamp = {Fri, 04 Nov 2022 13:48:49 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2211-01910.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2212-10560,
  author    = {Yizhong Wang and
               Yeganeh Kordi and
               Swaroop Mishra and
               Alisa Liu and
               Noah A. Smith and
               Daniel Khashabi and
               Hannaneh Hajishirzi},
  title     = {Self-Instruct: Aligning Language Model with Self Generated Instructions},
  journal   = {CoRR},
  volume    = {abs/2212.10560},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.10560},
  doi       = {10.48550/arXiv.2212.10560},
  eprinttype = {arXiv},
  eprint    = {2212.10560},
  timestamp = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-10560.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Instruction Tuning},
}

@inproceedings{DBLP:conf:emnlp:Wang0S22,
  author    = {Boshi Wang and
               Xiang Deng and
               Huan Sun},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {Iteratively Prompt Pre-trained Language Models for Chain of Thought},
  booktitle = {EMNLP},
  pages     = {2714--2730},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.174},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/Wang0S22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}
@String(DBLP:conf:emnlp:Wang0S22="(1) 提出了一种迭代式的prompt-tuning方法，他们认为soft prompt应该带有语境，即在自回归解码时不同时刻应该有不同的prompt向量；
(2) 利用BERT为encoder-decoder架构的PLM生成prompt，在每个解码时刻BERT都会根据先前时刻的上下文生成一组新的prompt向量，提供给PLM生成新的上下文，迭代往复。")


@article{DBLP:journals/corr/abs-2210-00720,
  author    = {Yao Fu and
               Hao Peng and
               Ashish Sabharwal and
               Peter Clark and
               Tushar Khot},
  title     = {Complexity-Based Prompting for Multi-Step Reasoning},
  journal   = {CoRR},
  volume    = {abs/2210.00720},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.00720},
  doi       = {10.48550/arXiv.2210.00720},
  eprinttype = {arXiv},
  eprint    = {2210.00720},
  timestamp = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-00720.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}

@article{DBLP:journals/corr/abs-2210-03350,
  author    = {Ofir Press and
               Muru Zhang and
               Sewon Min and
               Ludwig Schmidt and
               Noah A. Smith and
               Mike Lewis},
  title     = {Measuring and Narrowing the Compositionality Gap in Language Models},
  journal   = {CoRR},
  volume    = {abs/2210.03350},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.03350},
  doi       = {10.48550/arXiv.2210.03350},
  eprinttype = {arXiv},
  eprint    = {2210.03350},
  timestamp = {Wed, 12 Oct 2022 14:25:15 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-03350.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}

@article{DBLP:journals/corr/abs-2210-03493,
  author    = {Zhuosheng Zhang and
               Aston Zhang and
               Mu Li and
               Alex Smola},
  title     = {Automatic Chain of Thought Prompting in Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2210.03493},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.03493},
  doi       = {10.48550/arXiv.2210.03493},
  eprinttype = {arXiv},
  eprint    = {2210.03493},
  timestamp = {Fri, 10 Feb 2023 11:02:20 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-03493.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}

@inproceedings{DBLP:conf:acl:LuBM0S22,
  author    = {Yao Lu and
               Max Bartolo and
               Alastair Moore and
               Sebastian Riedel and
               Pontus Stenetorp},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Fantastically Ordered Prompts and Where to Find Them: Overcoming Few-Shot
               Prompt Order Sensitivity},
  booktitle = {ACL},
  pages     = {8086--8098},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.556},
  doi       = {10.18653/v1/2022.acl-long.556},
  timestamp = {Mon, 01 Aug 2022 16:27:50 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/LuBM0S22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
  plm       = {GPT-2, GPT-3},
}
@string(DBLP:conf:acl:LuBM0S22="(1) This work demonstrates that few-shot prompts suffer from order sensitivity, in that for the same prompt the order in which samples are provided can make a difference to model performance.
(2) This work introduces a probing method which constructs an artificial development set by language models themselves to alleviate the order sensitivity problem.")


@inproceedings{DBLP:conf:naacl:RubinHB22,
  author    = {Ohad Rubin and
               Jonathan Herzig and
               Jonathan Berant},
  editor    = {Marine Carpuat and
               Marie{-}Catherine de Marneffe and
               Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title     = {Learning To Retrieve Prompts for In-Context Learning},
  booktitle = {NAACL},
  pages     = {2655--2671},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.191},
  doi       = {10.18653/v1/2022.naacl-main.191},
  timestamp = {Mon, 01 Aug 2022 16:27:57 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/RubinHB22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
  plm       = {GPT-3, GPT-Neo, Codex, GPT-J, SBERT, BERT},
}
@String(DBLP:conf:naacl:RubinHB22="This paper proposes a method to retrieve good contexts for in-context learning. Specifically, the method
(1) uses an unsupervised retriever (BM25/SBERT) to obtain a set of context candidates,
(2) passes the candidates to a scoring model (GPT-Neo/GPT-J/GPT-3/Codex) and selects the top/bottom k as positive/negative examples,
(3) uses the examples to train a dense retriever (BERT-based).")


@inproceedings{DBLP:conf:emnlp:ZhangFT22,
  author    = {Yiming Zhang and
               Shi Feng and
               Chenhao Tan},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {Active Example Selection for In-Context Learning},
  booktitle = {EMNLP},
  pages     = {9134--9148},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.622},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ZhangFT22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
  code      = {https://github.com/ChicagoHAI/active-example-selection},
  plm       = {GPT-2, GPT-3},
}
@String(DBLP:conf:emnlp:ZhangFT22="(1) This paper revisits the effect of example selection (re-ordering & calibration) for ICL, observing that a large variance across sets of demonstration examples still exists.
(2) This paper applies reinforcement learning (Q-Learning) to optimize example selection by formulating this task as a sequential decision-making problem, which is appropriate for example selection from unlabeled datasets.")

@inproceedings{DBLP:conf/acl/SorensenRRSRDKF22,
  author    = {Taylor Sorensen and
               Joshua Robinson and
               Christopher Michael Rytting and
               Alexander Glenn Shaw and
               Kyle Jeffrey Rogers and
               Alexia Pauline Delorey and
               Mahmoud Khalil and
               Nancy Fulda and
               David Wingate},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {An Information-theoretic Approach to Prompt Engineering Without Ground
               Truth Labels},
  booktitle = {ACL},
  pages     = {819--862},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.60},
  doi       = {10.18653/v1/2022.acl-long.60},
  timestamp = {Mon, 01 Aug 2022 16:27:52 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/SorensenRRSRDKF22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2206-08082,
  author    = {Hyuhng Joon Kim and
               Hyunsoo Cho and
               Junyeob Kim and
               Taeuk Kim and
               Kang Min Yoo and
               Sang{-}goo Lee},
  title     = {Self-Generated In-Context Learning: Leveraging Auto-regressive Language
               Models as a Demonstration Generator},
  journal   = {CoRR},
  volume    = {abs/2206.08082},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2206.08082},
  doi       = {10.48550/arXiv.2206.08082},
  eprinttype = {arXiv},
  eprint    = {2206.08082},
  timestamp = {Tue, 21 Jun 2022 17:35:15 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2206-08082.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2212-04037,
  author    = {Hila Gonen and
               Srini Iyer and
               Terra Blevins and
               Noah A. Smith and
               Luke Zettlemoyer},
  title     = {Demystifying Prompts in Language Models via Perplexity Estimation},
  journal   = {CoRR},
  volume    = {abs/2212.04037},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.04037},
  doi       = {10.48550/arXiv.2212.04037},
  eprinttype = {arXiv},
  eprint    = {2212.04037},
  timestamp = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-04037.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

// NOTE(review): this entry's title and venue concern online learning in self-adaptive systems, yet it is tagged `In-Context Learning` -- possibly a DBLP search mismatch; confirm the intended paper.
@inproceedings{DBLP:conf/isola/AlbertsG22,
  author    = {Elvin Alberts and
               Ilias Gerostathopoulos},
  editor    = {Tiziana Margaria and
               Bernhard Steffen},
  title     = {Measuring Convergence Inertia: Online Learning in Self-adaptive Systems
               with Context Shifts},
  booktitle = {ISoLA},
  series    = {Lecture Notes in Computer Science},
  volume    = {13703},
  pages     = {231--248},
  publisher = {Springer},
  year      = {2022},
  url       = {https://doi.org/10.1007/978-3-031-19759-8\_15},
  doi       = {10.1007/978-3-031-19759-8\_15},
  timestamp = {Wed, 07 Dec 2022 23:13:48 +0100},
  biburl    = {https://dblp.org/rec/conf/isola/AlbertsG22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
    keywords={In-Context Learning}
}

@article{DBLP:journals/corr/abs-2201-11903,
  author    = {Jason Wei and
               Xuezhi Wang and
               Dale Schuurmans and
               Maarten Bosma and
               Ed H. Chi and
               Quoc V. Le and
               Denny Zhou},
  title     = {Chain of Thought Prompting Elicits Reasoning in Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2201.11903},
  year      = {2022},
  url       = {https://arxiv.org/abs/2201.11903},
  eprinttype = {arXiv},
  eprint    = {2201.11903},
  timestamp = {Fri, 22 Apr 2022 16:06:31 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2201-11903.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}

@article{DBLP:journals/corr/abs-2203-11171,
  author    = {Xuezhi Wang and
               Jason Wei and
               Dale Schuurmans and
               Quoc V. Le and
               Ed H. Chi and
               Denny Zhou},
  title     = {Self-Consistency Improves Chain of Thought Reasoning in Language Models},
  journal   = {CoRR},
  volume    = {abs/2203.11171},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2203.11171},
  doi       = {10.48550/arXiv.2203.11171},
  eprinttype = {arXiv},
  eprint    = {2203.11171},
  timestamp = {Fri, 22 Apr 2022 16:06:32 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2203-11171.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought},
}

@inproceedings{DBLP:conf/acl/LoganBWP0022,
  author    = {Logan IV, Robert L. and
               Ivana Balazevic and
               Eric Wallace and
               Fabio Petroni and
               Sameer Singh and
               Sebastian Riedel},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Cutting Down on Prompts and Parameters: Simple Few-Shot Learning with
               Language Models},
  booktitle = {ACL Findings},
  pages     = {2824--2835},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.findings-acl.222},
  doi       = {10.18653/v1/2022.findings-acl.222},
  timestamp = {Mon, 01 Aug 2022 16:27:44 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/LoganBWP0022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{DBLP:conf/emnlp/ChadaN21,
  author    = {Rakesh Chada and
               Pradeep Natarajan},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {{FewshotQA}: {A} simple framework for few-shot learning of question
               answering tasks using pre-trained text-to-text models},
  booktitle = {EMNLP},
  pages     = {6081--6090},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.491},
  doi       = {10.18653/v1/2021.emnlp-main.491},
  timestamp = {Thu, 20 Jan 2022 10:02:34 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ChadaN21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering, AIGC},
}

@inproceedings{DBLP:conf/emnlp/LesterAC21,
  author    = {Brian Lester and
               Rami Al{-}Rfou and
               Noah Constant},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {The Power of Scale for Parameter-Efficient Prompt Tuning},
  booktitle = {EMNLP},
  pages     = {3045--3059},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.243},
  doi       = {10.18653/v1/2021.emnlp-main.243},
  timestamp = {Wed, 16 Mar 2022 23:55:07 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/LesterAC21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{DBLP:conf/acl/WuS22,
  author    = {Hui Wu and
               Xiaodong Shi},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Adversarial Soft Prompt Tuning for Cross-Domain Sentiment Analysis},
  booktitle = {ACL},
  pages     = {2438--2447},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.174},
  doi       = {10.18653/v1/2022.acl-long.174},
  timestamp = {Wed, 07 Dec 2022 23:10:02 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/WuS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2204-00498,
  author    = {Nitarshan Rajkumar and
               Raymond Li and
               Dzmitry Bahdanau},
  title     = {Evaluating the Text-to-{SQL} Capabilities of Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2204.00498},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2204.00498},
  doi       = {10.48550/arXiv.2204.00498},
  eprinttype = {arXiv},
  eprint    = {2204.00498},
  timestamp = {Wed, 06 Apr 2022 14:29:31 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2204-00498.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation, Program and Code Generation},
}

@inproceedings{DBLP:conf/acl/CarlssonOLVNS22,
  author    = {Fredrik Carlsson and
               Joey {\"{O}}hman and
               Fangyu Liu and
               Severine Verlinden and
               Joakim Nivre and
               Magnus Sahlgren},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Fine-Grained Controllable Text Generation Using Non-Residual Prompting},
  booktitle = {ACL},
  pages     = {6837--6857},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.471},
  doi       = {10.18653/v1/2022.acl-long.471},
  timestamp = {Mon, 01 Aug 2022 16:27:52 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/CarlssonOLVNS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering, AIGC},
}

@inproceedings{DBLP:conf/acl/TanZW022,
  author    = {Zhixing Tan and
               Xiangwen Zhang and
               Shuo Wang and
               Yang Liu},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {{MSP:} Multi-Stage Prompting for Making Pre-trained Language Models
               Better Translators},
  booktitle = {ACL},
  pages     = {6131--6142},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.424},
  doi       = {10.18653/v1/2022.acl-long.424},
  timestamp = {Mon, 01 Aug 2022 16:27:47 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/TanZW022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{DBLP:conf/acl/MinLHZ22,
  author    = {Sewon Min and
               Mike Lewis and
               Hannaneh Hajishirzi and
               Luke Zettlemoyer},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Noisy Channel Language Model Prompting for Few-Shot Text Classification},
  booktitle = {ACL},
  pages     = {5316--5330},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.365},
  doi       = {10.18653/v1/2022.acl-long.365},
  timestamp = {Mon, 01 Aug 2022 16:27:50 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/MinLHZ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{DBLP:conf/acl/VuLCAC22,
  author    = {Tu Vu and
               Brian Lester and
               Noah Constant and
               Rami Al{-}Rfou' and
               Daniel Cer},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {{SPoT:} Better Frozen Model Adaptation through Soft Prompt Transfer},
  booktitle = {ACL},
  pages     = {5039--5059},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.346},
  doi       = {10.18653/v1/2022.acl-long.346},
  timestamp = {Mon, 01 Aug 2022 16:27:45 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/VuLCAC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}


// from Zhai Songlin

@article{DBLP:journals/pami/LangeAMPJLST22,
  author    = {De Lange, Matthias and
               Rahaf Aljundi and
               Marc Masana and
               Sarah Parisot and
               Xu Jia and
               Ales Leonardis and
               Gregory G. Slabaugh and
               Tinne Tuytelaars},
  title     = {A Continual Learning Survey: Defying Forgetting in Classification
               Tasks},
  journal   = {T-PAMI},
  volume    = {44},
  number    = {7},
  pages     = {3366--3385},
  year      = {2022},
  url       = {https://doi.org/10.1109/TPAMI.2021.3057446},
  doi       = {10.1109/TPAMI.2021.3057446},
  timestamp = {Tue, 28 Jun 2022 21:07:49 +0200},
  biburl    = {https://dblp.org/rec/journals/pami/LangeAMPJLST22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning, Survey},
}

@inproceedings{DBLP:conf/acl/QinZLL0SZ22,
  author    = {Yujia Qin and
               Jiajie Zhang and
               Yankai Lin and
               Zhiyuan Liu and
               Peng Li and
               Maosong Sun and
               Jie Zhou},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {{ELLE:} Efficient Lifelong Pre-training for Emerging Data},
  booktitle = {ACL Findings},
  pages     = {2789--2810},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.findings-acl.220},
  doi       = {10.18653/v1/2022.findings-acl.220},
  timestamp = {Thu, 13 Oct 2022 12:53:05 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/QinZLL0SZ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning},
}

@inproceedings{DBLP:conf/iclr/XieRL022,
  author    = {Sang Michael Xie and
               Aditi Raghunathan and
               Percy Liang and
               Tengyu Ma},
  title     = {An Explanation of In-context Learning as Implicit {Bayesian} Inference},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=RdJVFCHjUMI},
  timestamp = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/XieRL022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2203-06904,
  author    = {Ning Ding and
               Yujia Qin and
               Guang Yang and
               Fuchao Wei and
               Zonghan Yang and
               Yusheng Su and
               Shengding Hu and
               Yulin Chen and
               Chi{-}Min Chan and
               Weize Chen and
               Jing Yi and
               Weilin Zhao and
               Xiaozhi Wang and
               Zhiyuan Liu and
               Hai{-}Tao Zheng and
               Jianfei Chen and
               Yang Liu and
               Jie Tang and
               Juanzi Li and
               Maosong Sun},
  title     = {Delta Tuning: {A} Comprehensive Study of Parameter Efficient Methods
               for Pre-trained Language Models},
  journal   = {CoRR},
  volume    = {abs/2203.06904},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2203.06904},
  doi       = {10.48550/arXiv.2203.06904},
  eprinttype = {arXiv},
  eprint    = {2203.06904},
  timestamp = {Tue, 24 Jan 2023 15:06:31 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2203-06904.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{DBLP:conf/emnlp/MinLHALHZ22,
  author    = {Sewon Min and
               Xinxi Lyu and
               Ari Holtzman and
               Mikel Artetxe and
               Mike Lewis and
               Hannaneh Hajishirzi and
               Luke Zettlemoyer},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {Rethinking the Role of Demonstrations: What Makes In-Context Learning
               Work?},
  booktitle = {EMNLP},
  pages     = {11048--11064},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.759},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/MinLHALHZ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
}

@inproceedings{DBLP:conf/naacl/JinZZ00WA022,
  author    = {Xisen Jin and
               Dejiao Zhang and
               Henghui Zhu and
               Wei Xiao and
               Shang{-}Wen Li and
               Xiaokai Wei and
               Andrew O. Arnold and
               Xiang Ren},
  editor    = {Marine Carpuat and
               Marie{-}Catherine de Marneffe and
               Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title     = {Lifelong Pretraining: Continually Adapting Language Models to Emerging
               Corpora},
  booktitle = {NAACL},
  pages     = {4764--4780},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.351},
  doi       = {10.18653/v1/2022.naacl-main.351},
  timestamp = {Mon, 01 Aug 2022 16:27:59 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/JinZZ00WA022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning},
}

@inproceedings{DBLP:conf/automl/BansalAWLM22,
  author    = {Trapit Bansal and
               Salaheddin Alzubi and
               Tong Wang and
               Jay{-}Yoon Lee and
               Andrew McCallum},
  editor    = {Isabelle Guyon and
               Marius Lindauer and
               Mihaela van der Schaar and
               Frank Hutter and
               Roman Garnett},
  title     = {Meta-Adapters: Parameter Efficient Few-shot Fine-tuning through Meta-Learning},
  booktitle = {AutoML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {188},
  pages     = {19/1--18},
  publisher = {{PMLR}},
  year      = {2022},
  url       = {https://proceedings.mlr.press/v188/bansal22a.html},
  timestamp = {Mon, 28 Nov 2022 12:30:36 +0100},
  biburl    = {https://dblp.org/rec/conf/automl/BansalAWLM22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering},
}

@inproceedings{hu2022sparse,
  author     = {Shengding Hu and
                Zhen Zhang and
                Ning Ding and
                Yadao Wang and
                Yasheng Wang and
                Zhiyuan Liu and
                Maosong Sun},
  title      = {Sparse Structure Search for Delta Tuning},
  booktitle  = {NeurIPS},
  year       = {2022},
  url        = {https://openreview.net/forum?id=oOte_397Q4P},
  keywords   = {Prompt Engineering}
}

@inproceedings{DBLP:conf/www/YeZDCCXCC22,
  author     = {Hongbin Ye and
                Ningyu Zhang and
                Shumin Deng and
                Xiang Chen and
                Hui Chen and
                Feiyu Xiong and
                Xi Chen and
                Huajun Chen},
  editor     = {Fr{\'{e}}d{\'{e}}rique Laforest and
                Rapha{\"{e}}l Troncy and
                Elena Simperl and
                Deepak Agarwal and
                Aristides Gionis and
                Ivan Herman and
                Lionel M{\'{e}}dini},
  title      = {Ontology-enhanced Prompt-tuning for Few-shot Learning},
  booktitle  = {WWW},
  pages      = {778--787},
  publisher  = {{ACM}},
  year       = {2022},
  doi        = {10.1145/3485447.3511921},
  url        = {https://doi.org/10.1145/3485447.3511921},
  keywords   = {Prompt Engineering},
  timestamp  = {Wed, 28 Dec 2022 16:23:40 +0100},
  biburl     = {https://dblp.org/rec/conf/www/YeZDCCXCC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}


@article{DBLP:journals/corr/abs-2212-06950,
  author     = {Xuandong Zhao and
                Siqi Ouyang and
                Zhiguo Yu and
                Ming Wu and
                Lei Li},
  title      = {Pre-trained Language Models can be Fully Zero-Shot Learners},
  journal    = {CoRR},
  volume     = {abs/2212.06950},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.06950},
  url        = {https://doi.org/10.48550/arXiv.2212.06950},
  eprinttype = {arXiv},
  eprint     = {2212.06950},
  keywords   = {Prompt Engineering},
  timestamp  = {Sat, 04 Feb 2023 01:14:59 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-06950.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/jair/KhetarpalRRP22,
  author     = {Khimya Khetarpal and
                Matthew Riemer and
                Irina Rish and
                Doina Precup},
  title      = {Towards Continual Reinforcement Learning: {A} Review and Perspectives},
  journal    = {JAIR},
  volume     = {75},
  pages      = {1401--1476},
  year       = {2022},
  doi        = {10.1613/jair.1.13673},
  url        = {https://doi.org/10.1613/jair.1.13673},
  keywords   = {Continual Learning},
  timestamp  = {Thu, 05 Jan 2023 17:22:32 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/KhetarpalRRP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/aaai/Huang0GZ20,
  author     = {Jiabo Huang and
                Qi Dong and
                Shaogang Gong and
                Xiatian Zhu},
  title      = {Unsupervised Deep Learning via Affinity Diffusion},
  booktitle  = {AAAI},
  pages      = {11029--11036},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/6757},
  keywords   = {Others},
  timestamp  = {Mon, 07 Mar 2022 16:58:02 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/Huang0GZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:journals/corr/abs-2212-12990,
  author     = {Zijian Zhang and
                Zhou Zhao and
                Zhijie Lin},
  title      = {Unsupervised Representation Learning from Pre-trained Diffusion Probabilistic Models},
  booktitle  = {NeurIPS},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.12990},
  url        = {https://doi.org/10.48550/arXiv.2212.12990},
  eprinttype = {arXiv},
  eprint     = {2212.12990},
  keywords   = {Others},
  timestamp  = {Thu, 05 Jan 2023 09:37:44 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-12990.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/nips/PalatucciPHM09,
  author     = {Mark Palatucci and
                Dean Pomerleau and
                Geoffrey E. Hinton and
                Tom M. Mitchell},
  editor     = {Yoshua Bengio and
                Dale Schuurmans and
                John D. Lafferty and
                Christopher K. I. Williams and
                Aron Culotta},
  title      = {Zero-shot Learning with Semantic Output Codes},
  booktitle  = {NeurIPS},
  pages      = {1410--1418},
  publisher  = {Curran Associates, Inc.},
  year       = {2009},
  url        = {https://proceedings.neurips.cc/paper/2009/hash/1543843a4723ed2ab08e18053ae6dc5b-Abstract.html},
  keywords   = {Knowledge Enhanced},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/PalatucciPHM09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cvpr/LampertNH09,
  author     = {Christoph H. Lampert and
                Hannes Nickisch and
                Stefan Harmeling},
  title      = {Learning to detect unseen object classes by between-class attribute transfer},
  booktitle  = {CVPR},
  pages      = {951--958},
  publisher  = {{IEEE} Computer Society},
  year       = {2009},
  doi        = {10.1109/CVPR.2009.5206594},
  url        = {https://doi.org/10.1109/CVPR.2009.5206594},
  keywords   = {Others},
  timestamp  = {Fri, 14 Feb 2020 11:46:23 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/LampertNH09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}


% Entries below are from BI Sheng

@inproceedings{DBLP:conf/acl/BaoHWWW20,
  author     = {Siqi Bao and
                Huang He and
                Fan Wang and
                Hua Wu and
                Haifeng Wang},
  editor     = {Dan Jurafsky and
                Joyce Chai and
                Natalie Schluter and
                Joel R. Tetreault},
  title      = {{PLATO:} Pre-trained Dialogue Generation Model with Discrete Latent Variable},
  booktitle  = {ACL},
  pages      = {85--96},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.acl-main.9},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.9},
  keywords   = {AIGC},
  timestamp  = {Thu, 23 Sep 2021 15:08:29 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/BaoHWWW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/Cao020,
  author     = {Shuyang Cao and
                Lu Wang},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Controllable Open-ended Question Generation with {A} New Question Type Ontology},
  booktitle  = {ACL},
  pages      = {6424--6439},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.acl-long.502},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.502},
  keywords   = {Controllable Text Generation},
  timestamp  = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Cao020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2006-14799,
  author     = {Asli Celikyilmaz and
                Elizabeth Clark and
                Jianfeng Gao},
  title      = {Evaluation of Text Generation: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2006.14799},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.14799},
  eprinttype = {arXiv},
  eprint     = {2006.14799},
  keywords   = {Evaluation, AIGC, Survey},
  timestamp  = {Wed, 03 Mar 2021 07:40:24 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-14799.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/emnlp/ChenSYW20,
  author     = {Wenhu Chen and
                Yu Su and
                Xifeng Yan and
                William Yang Wang},
  editor     = {Bonnie Webber and
                Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {{KGPT:} Knowledge-Grounded Pre-Training for Data-to-Text Generation},
  booktitle  = {EMNLP},
  pages      = {8635--8648},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.emnlp-main.697},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.697},
  keywords   = {AIGC, Knowledge Enhanced},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChenSYW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/ChenGCLL20,
  author     = {Yen{-}Chun Chen and
                Zhe Gan and
                Yu Cheng and
                Jingzhou Liu and
                Jingjing Liu},
  editor     = {Dan Jurafsky and
                Joyce Chai and
                Natalie Schluter and
                Joel R. Tetreault},
  title      = {Distilling Knowledge Learned in {BERT} for Text Generation},
  booktitle  = {ACL},
  pages      = {7893--7905},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.acl-main.705},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.705},
  keywords   = {AIGC, Knowledge Distillation},
  timestamp  = {Fri, 06 Aug 2021 00:40:57 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChenGCLL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/emnlp/ChenCZZZSW20,
  author     = {Zhiyu Chen and
                Wenhu Chen and
                Hanwen Zha and
                Xiyou Zhou and
                Yunkai Zhang and
                Sairam Sundaresan and
                William Yang Wang},
  editor     = {Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {{Logic2Text:} High-Fidelity Natural Language Generation from Logical Forms},
  booktitle  = {EMNLP Findings},
  series     = {Findings of {ACL}},
  volume     = {{EMNLP} 2020},
  pages      = {2096--2111},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.findings-emnlp.190},
  url        = {https://doi.org/10.18653/v1/2020.findings-emnlp.190},
  keywords   = {AIGC},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChenCZZZSW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/aaai/Chi0WWMH20,
  author     = {Zewen Chi and
                Li Dong and
                Furu Wei and
                Wenhui Wang and
                Xian{-}Ling Mao and
                Heyan Huang},
  title      = {Cross-Lingual Natural Language Generation via Pre-Training},
  booktitle  = {AAAI},
  pages      = {7570--7577},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/6256},
  keywords   = {AIGC},
  timestamp  = {Mon, 07 Mar 2022 16:58:26 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/Chi0WWMH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/iclr/DathathriMLHFMY20,
  author     = {Sumanth Dathathri and
                Andrea Madotto and
                Janice Lan and
                Jane Hung and
                Eric Frank and
                Piero Molino and
                Jason Yosinski and
                Rosanne Liu},
  title      = {Plug and Play Language Models: {A} Simple Approach to Controlled Text Generation},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1edEyBKDS},
  keywords   = {Controllable Text Generation},
  timestamp  = {Thu, 07 May 2020 17:11:48 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/DathathriMLHFMY20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/nips/00040WWLWGZH19,
  author     = {Li Dong and
                Nan Yang and
                Wenhui Wang and
                Furu Wei and
                Xiaodong Liu and
                Yu Wang and
                Jianfeng Gao and
                Ming Zhou and
                Hsiao{-}Wuen Hon},
  editor     = {Hanna M. Wallach and
                Hugo Larochelle and
                Alina Beygelzimer and
                Florence d'Alch{\'{e}}{-}Buc and
                Emily B. Fox and
                Roman Garnett},
  title      = {Unified Language Model Pre-training for Natural Language Understanding and Generation},
  booktitle  = {NeurIPS},
  pages      = {13042--13054},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/c20bb2d9a50d5ac1f713f8b34d9aac5a-Abstract.html},
  keywords   = {AIGC, Natural Language Understanding},
  timestamp  = {Mon, 30 May 2022 13:48:58 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/00040WWLWGZH19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2103-10360,
  author     = {Zhengxiao Du and
                Yujie Qian and
                Xiao Liu and
                Ming Ding and
                Jiezhong Qiu and
                Zhilin Yang and
                Jie Tang},
  title      = {All {NLP} Tasks Are Generation Tasks: {A} General Pretraining Framework},
  journal    = {CoRR},
  volume     = {abs/2103.10360},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.10360},
  eprinttype = {arXiv},
  eprint     = {2103.10360},
  keywords   = {AIGC},
  timestamp  = {Wed, 24 Mar 2021 15:50:40 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-10360.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/emnlp/RibeiroPZG21,
  author     = {Leonardo F. R. Ribeiro and
                Jonas Pfeiffer and
                Yue Zhang and
                Iryna Gurevych},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {Smelting Gold and Silver for Improved Multilingual {AMR}-to-Text Generation},
  booktitle  = {EMNLP},
  pages      = {742--750},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.emnlp-main.57},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.57},
  keywords   = {AIGC},
  timestamp  = {Thu, 20 Jan 2022 10:02:20 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/RibeiroPZG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}


@article{DBLP:journals/corr/abs-2007-15780,
  author     = {Cristina Garbacea and
                Qiaozhu Mei},
  title      = {Neural Language Generation: Formulation, Methods, and Evaluation},
  journal    = {CoRR},
  volume     = {abs/2007.15780},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.15780},
  eprinttype = {arXiv},
  eprint     = {2007.15780},
  keywords   = {AIGC, Evaluation},
  timestamp  = {Mon, 03 Aug 2020 14:32:13 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-15780.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/GolovanovKNTTW19,
  author     = {Sergey Golovanov and
                Rauf Kurbanov and
                Sergey I. Nikolenko and
                Kyryl Truskovskyi and
                Alexander Tselousov and
                Thomas Wolf},
  editor     = {Anna Korhonen and
                David R. Traum and
                Llu{\'{\i}}s M{\`{a}}rquez},
  title      = {Large-Scale Transfer Learning for Natural Language Generation},
  booktitle  = {ACL},
  pages      = {6053--6058},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  doi        = {10.18653/v1/p19-1608},
  url        = {https://doi.org/10.18653/v1/p19-1608},
  keywords   = {AIGC},
  timestamp  = {Fri, 06 Aug 2021 00:41:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/GolovanovKNTTW19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/coling/GongSFQBLL20,
  author     = {Heng Gong and
                Yawei Sun and
                Xiaocheng Feng and
                Bing Qin and
                Wei Bi and
                Xiaojiang Liu and
                Ting Liu},
  editor     = {Donia Scott and
                N{\'{u}}ria Bel and
                Chengqing Zong},
  title      = {{TableGPT:} Few-shot Table-to-Text Generation with Table Structure Reconstruction and Content Matching},
  booktitle  = {COLING},
  pages      = {1978--1988},
  publisher  = {International Committee on Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.coling-main.179},
  url        = {https://doi.org/10.18653/v1/2020.coling-main.179},
  keywords   = {AIGC},
  timestamp  = {Fri, 06 Aug 2021 00:39:57 +0200},
  biburl     = {https://dblp.org/rec/conf/coling/GongSFQBLL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/GuWWSY20,
  author     = {Jing Gu and
                Qingyang Wu and
                Chongruo Wu and
                Weiyan Shi and
                Zhou Yu},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {{PRAL:} {A} Tailored Pre-Training Model for Task-Oriented Dialog Generation},
  booktitle  = {ACL},
  pages      = {305--313},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.acl-short.40},
  url        = {https://doi.org/10.18653/v1/2021.acl-short.40},
  keywords   = {AIGC},
  timestamp  = {Mon, 09 Aug 2021 16:25:38 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/GuWWSY20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/aaai/GuYH21,
  author     = {Xiaodong Gu and
                Kang Min Yoo and
                Jung{-}Woo Ha},
  title      = {{DialogBERT:} Discourse-Aware Response Generation via Learning to Recover and Rank Utterances},
  booktitle  = {AAAI},
  pages      = {12911--12919},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/17527},
  keywords   = {AIGC},
  timestamp  = {Mon, 26 Sep 2022 11:56:49 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/GuYH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2111-02643,
  author     = {Xiaodong Gu and
                Kang Min Yoo and
                Sang{-}Woo Lee},
  title      = {Response Generation with Context-Aware Prompt Learning},
  journal    = {CoRR},
  volume     = {abs/2111.02643},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.02643},
  eprinttype = {arXiv},
  eprint     = {2111.02643},
  keywords   = {AIGC, In-Context Learning},
  timestamp  = {Thu, 13 Oct 2022 08:59:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-02643.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tacl/GuanHHZZ20,
  author     = {Jian Guan and
                Fei Huang and
                Minlie Huang and
                Zhihao Zhao and
                Xiaoyan Zhu},
  title      = {A Knowledge-Enhanced Pretraining Model for Commonsense Story Generation},
  journal    = {TACL},
  volume     = {8},
  pages      = {93--108},
  year       = {2020},
  doi        = {10.1162/tacl\_a\_00302},
  url        = {https://doi.org/10.1162/tacl\_a\_00302},
  keywords   = {AIGC, Knowledge Enhanced},
  timestamp  = {Fri, 10 Jun 2022 10:35:17 +0200},
  biburl     = {https://dblp.org/rec/journals/tacl/GuanHHZZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/coling/HarkousGS20,
  author     = {Hamza Harkous and
                Isabel Groves and
                Amir Saffari},
  editor     = {Donia Scott and
                N{\'{u}}ria Bel and
                Chengqing Zong},
  title      = {Have Your Text and Use It Too! End-to-End Neural Data-to-Text Generation with Semantic Fidelity},
  booktitle  = {COLING},
  pages      = {2410--2424},
  publisher  = {International Committee on Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.coling-main.218},
  url        = {https://doi.org/10.18653/v1/2020.coling-main.218},
  keywords   = {AIGC},
  timestamp  = {Fri, 06 Aug 2021 00:39:46 +0200},
  biburl     = {https://dblp.org/rec/conf/coling/HarkousGS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/HuaS020,
  author     = {Xinyu Hua and
                Ashwin Sreevatsa and
                Lu Wang},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {{DYPLOC:} Dynamic Planning of Content Using Mixed Language Models for Text Generation},
  booktitle  = {ACL},
  pages      = {6408--6423},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.acl-long.501},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.501},
  keywords   = {AIGC},
  timestamp  = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/HuaS020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/HuangQSZ21,
  author     = {Xinting Huang and
                Jianzhong Qi and
                Yu Sun and
                Rui Zhang},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Latent Reasoning for Low-Resource Question Generation},
  booktitle  = {ACL Findings},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {3008--3022},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.findings-acl.265},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.265},
  keywords   = {AIGC},
  timestamp  = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/HuangQSZ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/jksucis/IqbalQ22,
  author     = {Touseef Iqbal and
                Shaima Qureshi},
  title      = {The survey: Text generation models in deep learning},
  journal    = {JKSUCIS},
  volume     = {34},
  number     = {6 Part {A}},
  pages      = {2515--2528},
  year       = {2022},
  doi        = {10.1016/j.jksuci.2020.04.001},
  url        = {https://doi.org/10.1016/j.jksuci.2020.04.001},
  keywords   = {AIGC, Survey},
  timestamp  = {Mon, 19 Dec 2022 17:10:36 +0100},
  biburl     = {https://dblp.org/rec/journals/jksucis/IqbalQ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/KeJRCWSZH21,
  author     = {Pei Ke and
                Haozhe Ji and
                Yu Ran and
                Xin Cui and
                Liwei Wang and
                Linfeng Song and
                Xiaoyan Zhu and
                Minlie Huang},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {{JointGT:} Graph-Text Joint Representation Learning for Text Generation from Knowledge Graphs},
  booktitle  = {ACL Findings},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {2526--2538},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.findings-acl.223},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.223},
  keywords   = {AIGC},
  timestamp  = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/KeJRCWSZH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-1909-05858,
  author     = {Nitish Shirish Keskar and
                Bryan McCann and
                Lav R. Varshney and
                Caiming Xiong and
                Richard Socher},
  title      = {{CTRL:} {A} Conditional Transformer Language Model for Controllable Generation},
  journal    = {CoRR},
  volume     = {abs/1909.05858},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.05858},
  eprinttype = {arXiv},
  eprint     = {1909.05858},
  keywords   = {Controllable Text Generation},
  timestamp  = {Wed, 18 Sep 2019 10:38:36 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-05858.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/iclr/KhalifaED21,
  author     = {Muhammad Khalifa and
                Hady Elsahar and
                Marc Dymetman},
  title      = {A Distributional Approach to Controlled Text Generation},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=jWkw45-9AbL},
  keywords   = {Controllable Text Generation},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KhalifaED21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/emnlp/KrishnaWI20,
  author     = {Kalpesh Krishna and
                John Wieting and
                Mohit Iyyer},
  editor     = {Bonnie Webber and
                Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {Reformulating Unsupervised Style Transfer as Paraphrase Generation},
  booktitle  = {EMNLP},
  pages      = {737--762},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.emnlp-main.55},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.55},
  keywords   = {AIGC},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/KrishnaWI20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/LewisLGGMLSZ20,
  author     = {Mike Lewis and
                Yinhan Liu and
                Naman Goyal and
                Marjan Ghazvininejad and
                Abdelrahman Mohamed and
                Omer Levy and
                Veselin Stoyanov and
                Luke Zettlemoyer},
  editor     = {Dan Jurafsky and
                Joyce Chai and
                Natalie Schluter and
                Joel R. Tetreault},
  title      = {{BART:} Denoising Sequence-to-Sequence Pre-training for Natural Language Generation, Translation, and Comprehension},
  booktitle  = {ACL},
  pages      = {7871--7880},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.acl-main.703},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.703},
  keywords   = {AIGC},
  timestamp  = {Wed, 16 Mar 2022 23:55:02 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/LewisLGGMLSZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cikm/LiLZHWYW20,
  author     = {Junyi Li and
                Siqing Li and
                Wayne Xin Zhao and
                Gaole He and
                Zhicheng Wei and
                Nicholas Jing Yuan and
                Ji{-}Rong Wen},
  editor     = {Mathieu d'Aquin and
                Stefan Dietze and
                Claudia Hauff and
                Edward Curry and
                Philippe Cudr{\'{e}}{-}Mauroux},
  title      = {Knowledge-Enhanced Personalized Review Generation with Capsule Graph Neural Network},
  booktitle  = {CIKM},
  pages      = {735--744},
  publisher  = {{ACM}},
  year       = {2020},
  doi        = {10.1145/3340531.3411893},
  url        = {https://doi.org/10.1145/3340531.3411893},
  keywords   = {AIGC, Knowledge Enhanced},
  timestamp  = {Thu, 14 Oct 2021 10:46:17 +0200},
  biburl     = {https://dblp.org/rec/conf/cikm/LiLZHWYW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/LiTHJHXCYZW21,
  author     = {Junyi Li and
                Tianyi Tang and
                Gaole He and
                Jinhao Jiang and
                Xiaoxuan Hu and
                Puzhao Xie and
                Zhipeng Chen and
                Zhuohao Yu and
                Wayne Xin Zhao and
                Ji{-}Rong Wen},
  editor     = {Heng Ji and
                Jong C. Park and
                Rui Xia},
  title      = {{TextBox:} {A} Unified, Modularized, and Extensible Framework for Text Generation},
  booktitle  = {ACL},
  pages      = {30--39},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.acl-demo.4},
  url        = {https://doi.org/10.18653/v1/2021.acl-demo.4},
  keywords   = {AIGC},
  timestamp  = {Wed, 07 Dec 2022 23:10:02 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/LiTHJHXCYZW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/LiTZWYW21,
  author     = {Junyi Li and
                Tianyi Tang and
                Wayne Xin Zhao and
                Zhicheng Wei and
                Nicholas Jing Yuan and
                Ji{-}Rong Wen},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Few-shot Knowledge Graph-to-Text Generation with Pretrained Language Models},
  booktitle  = {ACL Findings},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {1558--1568},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.findings-acl.136},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.136},
  keywords   = {AIGC},
  timestamp  = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiTZWYW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sigir/LiZWYW21,
  author     = {Junyi Li and
                Wayne Xin Zhao and
                Zhicheng Wei and
                Nicholas Jing Yuan and
                Ji{-}Rong Wen},
  editor     = {Fernando Diaz and
                Chirag Shah and
                Torsten Suel and
                Pablo Castells and
                Rosie Jones and
                Tetsuya Sakai},
  title      = {Knowledge-based Review Generation by Coherence Enhanced Text Planning},
  booktitle  = {SIGIR},
  pages      = {183--192},
  publisher  = {{ACM}},
  year       = {2021},
  doi        = {10.1145/3404835.3462865},
  url        = {https://doi.org/10.1145/3404835.3462865},
  keywords   = {AIGC, Knowledge Enhanced},
  timestamp  = {Thu, 15 Jul 2021 15:30:48 +0200},
  biburl     = {https://dblp.org/rec/conf/sigir/LiZWYW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/LiZLS20,
  author     = {Piji Li and
                Haisong Zhang and
                Xiaojiang Liu and
                Shuming Shi},
  editor     = {Dan Jurafsky and
                Joyce Chai and
                Natalie Schluter and
                Joel R. Tetreault},
  title      = {Rigid Formats Controlled Text Generation},
  booktitle  = {ACL},
  pages      = {742--751},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.acl-main.68},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.68},
  keywords   = {Controllable Text Generation},
  timestamp  = {Fri, 06 Aug 2021 00:40:57 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiZLS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acl/LiL20,
  author    = {Xiang Lisa Li and
               Percy Liang},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {Prefix-Tuning: Optimizing Continuous Prompts for Generation},
  booktitle = {ACL},
  pages     = {4582--4597},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.353},
  doi       = {10.18653/v1/2021.acl-long.353},
  timestamp = {Wed, 16 Mar 2022 23:55:03 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/LiL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Prompt Engineering}
}

@inproceedings{DBLP:conf/acl/LiuYGQZJCFSGWCJ21,
  author    = {Dayiheng Liu and
               Yu Yan and
               Yeyun Gong and
               Weizhen Qi and
               Hang Zhang and
               Jian Jiao and
               Weizhu Chen and
               Jie Fu and
               Linjun Shou and
               Ming Gong and
               Pengcheng Wang and
               Jiusheng Chen and
               Daxin Jiang and
               Jiancheng Lv and
               Ruofei Zhang and
               Winnie Wu and
               Ming Zhou and
               Nan Duan},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {{GLGE:} {A} New General Language Generation Evaluation Benchmark},
  booktitle = {ACL Findings},
  series    = {Findings of {ACL}},
  volume    = {{ACL/IJCNLP} 2021},
  pages     = {408--420},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.36},
  doi       = {10.18653/v1/2021.findings-acl.36},
  timestamp = {Thu, 12 Jan 2023 14:29:18 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/LiuYGQZJCFSGWCJ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Evaluation}
}

@inproceedings{DBLP:conf/emnlp/LiuZLRZY21,
  author    = {Shilei Liu and
               Xiaofeng Zhao and
               Bochao Li and
               Feiliang Ren and
               Longhui Zhang and
               Shujuan Yin},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {A Three-Stage Learning Framework for Low-Resource Knowledge-Grounded
               Dialogue Generation},
  booktitle = {EMNLP},
  pages     = {2262--2272},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.173},
  doi       = {10.18653/v1/2021.emnlp-main.173},
  timestamp = {Wed, 07 Dec 2022 23:12:22 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/LiuZLRZY21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Knowledge Enhanced}
}

@inproceedings{DBLP:conf/acl/Luo0LLBHHS20,
  author    = {Fuli Luo and
               Wei Wang and
               Jiahao Liu and
               Yijia Liu and
               Bin Bi and
               Songfang Huang and
               Fei Huang and
               Luo Si},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {{VECO:} Variable and Flexible Cross-lingual Pre-training for Language
               Understanding and Generation},
  booktitle = {ACL},
  pages     = {3980--3994},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.308},
  doi       = {10.18653/v1/2021.acl-long.308},
  timestamp = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/Luo0LLBHHS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Natural Language Understanding}
}

@article{DBLP:journals/corr/abs-2002-06353,
  author    = {Huaishao Luo and
               Lei Ji and
               Botian Shi and
               Haoyang Huang and
               Nan Duan and
               Tianrui Li and
               Xilin Chen and
               Ming Zhou},
  title     = {{UniViLM}: {A} Unified Video and Language Pre-Training Model for Multimodal
               Understanding and Generation},
  journal   = {CoRR},
  volume    = {abs/2002.06353},
  year      = {2020},
  url       = {https://arxiv.org/abs/2002.06353},
  eprinttype = {arXiv},
  eprint    = {2002.06353},
  timestamp = {Wed, 20 Jul 2022 10:55:47 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2002-06353.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Multimodal, Natural Language Understanding}
}

@inproceedings{DBLP:conf/acl/MagerANSLFR20,
  author    = {Manuel Mager and
               Ram{\'{o}}n Fernandez Astudillo and
               Tahira Naseem and
               Md. Arafat Sultan and
               Young{-}Suk Lee and
               Radu Florian and
               Salim Roukos},
  editor    = {Dan Jurafsky and
               Joyce Chai and
               Natalie Schluter and
               Joel R. Tetreault},
  title     = {{GPT-too}: {A} Language-Model-First Approach for {AMR}-to-Text Generation},
  booktitle = {ACL},
  pages     = {1846--1852},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.acl-main.167},
  doi       = {10.18653/v1/2020.acl-main.167},
  timestamp = {Fri, 06 Aug 2021 00:41:04 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/MagerANSLFR20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}
@inproceedings{DBLP:conf/naacl/MajumderRGM21,
  author    = {Bodhisattwa Prasad Majumder and
               Sudha Rao and
               Michel Galley and
               Julian J. McAuley},
  editor    = {Kristina Toutanova and
               Anna Rumshisky and
               Luke Zettlemoyer and
               Dilek Hakkani{-}T{\"{u}}r and
               Iz Beltagy and
               Steven Bethard and
               Ryan Cotterell and
               Tanmoy Chakraborty and
               Yichao Zhou},
  title     = {Ask what's missing and what's useful: Improving Clarification Question
               Generation using Global Knowledge},
  booktitle = {NAACL},
  pages     = {4300--4312},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.naacl-main.340},
  doi       = {10.18653/v1/2021.naacl-main.340},
  timestamp = {Fri, 06 Aug 2021 00:41:31 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/MajumderRGM21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Knowledge Enhanced}
}

@inproceedings{DBLP:conf/emnlp/MaoMMC19,
  author    = {Huanru Henry Mao and
               Bodhisattwa Prasad Majumder and
               Julian J. McAuley and
               Garrison W. Cottrell},
  editor    = {Kentaro Inui and
               Jing Jiang and
               Vincent Ng and
               Xiaojun Wan},
  title     = {Improving Neural Story Generation by Targeted Common Sense Grounding},
  booktitle = {EMNLP},
  pages     = {5987--5992},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/D19-1615},
  doi       = {10.18653/v1/D19-1615},
  timestamp = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/MaoMMC19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/MauryaDKD21,
  author    = {Kaushal Kumar Maurya and
               Maunendra Sankar Desarkar and
               Yoshinobu Kano and
               Kumari Deepshikha},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {{ZmBART}: An Unsupervised Cross-lingual Transfer Framework for Language
               Generation},
  booktitle = {ACL Findings},
  series    = {Findings of {ACL}},
  volume    = {{ACL/IJCNLP} 2021},
  pages     = {2804--2818},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.248},
  doi       = {10.18653/v1/2021.findings-acl.248},
  timestamp = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/MauryaDKD21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/PascualEMCW21,
  author    = {Damian Pascual and
               Beni Egressy and
               Clara Meister and
               Ryan Cotterell and
               Roger Wattenhofer},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {A Plug-and-Play Method for Controlled Text Generation},
  booktitle = {EMNLP Findings},
  pages     = {3973--3997},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-emnlp.334},
  doi       = {10.18653/v1/2021.findings-emnlp.334},
  timestamp = {Thu, 20 Jan 2022 10:02:07 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/PascualEMCW21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Controllable Text Generation}
}

@inproceedings{DBLP:conf/emnlp/PengZLLLZG20,
  author    = {Baolin Peng and
               Chenguang Zhu and
               Chunyuan Li and
               Xiujun Li and
               Jinchao Li and
               Michael Zeng and
               Jianfeng Gao},
  editor    = {Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {Few-shot Natural Language Generation for Task-Oriented Dialog},
  booktitle = {EMNLP Findings},
  series    = {Findings of {ACL}},
  volume    = {{EMNLP} 2020},
  pages     = {172--182},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.findings-emnlp.17},
  doi       = {10.18653/v1/2020.findings-emnlp.17},
  timestamp = {Fri, 13 May 2022 11:42:33 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/PengZLLLZG20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/RashkinCCG20,
  author    = {Hannah Rashkin and
               Asli Celikyilmaz and
               Yejin Choi and
               Jianfeng Gao},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {{PlotMachines}: Outline-Conditioned Generation with Dynamic Plot State
               Tracking},
  booktitle = {EMNLP},
  pages     = {4274--4295},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.349},
  doi       = {10.18653/v1/2020.emnlp-main.349},
  timestamp = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/RashkinCCG20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@article{DBLP:journals/corr/abs-2007-08426,
  author    = {Leonardo F. R. Ribeiro and
               Martin Schmitt and
               Hinrich Sch{\"{u}}tze and
               Iryna Gurevych},
  title     = {Investigating Pretrained Language Models for Graph-to-Text Generation},
  journal   = {CoRR},
  volume    = {abs/2007.08426},
  year      = {2020},
  url       = {https://arxiv.org/abs/2007.08426},
  eprinttype = {arXiv},
  eprint    = {2007.08426},
  timestamp = {Wed, 22 Jul 2020 12:09:15 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2007-08426.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/RibeiroZG21,
  author    = {Leonardo F. R. Ribeiro and
               Yue Zhang and
               Iryna Gurevych},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {Structural Adapters in Pretrained Language Models for {AMR}-to-Text
               Generation},
  booktitle = {EMNLP},
  pages     = {4269--4282},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.351},
  doi       = {10.18653/v1/2021.emnlp-main.351},
  timestamp = {Thu, 20 Jan 2022 10:02:24 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/RibeiroZG21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@article{DBLP:journals/tacl/RotheNS20,
  author    = {Sascha Rothe and
               Shashi Narayan and
               Aliaksei Severyn},
  title     = {Leveraging Pre-trained Checkpoints for Sequence Generation Tasks},
  journal   = {TACL},
  volume    = {8},
  pages     = {264--280},
  year      = {2020},
  url       = {https://doi.org/10.1162/tacl\_a\_00313},
  doi       = {10.1162/tacl\_a\_00313},
  timestamp = {Fri, 10 Jun 2022 10:35:17 +0200},
  biburl    = {https://dblp.org/rec/journals/tacl/RotheNS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/icml/SongTQLL19,
  author    = {Kaitao Song and
               Xu Tan and
               Tao Qin and
               Jianfeng Lu and
               Tie{-}Yan Liu},
  editor    = {Kamalika Chaudhuri and
               Ruslan Salakhutdinov},
  title     = {{MASS:} Masked Sequence to Sequence Pre-training for Language Generation},
  booktitle = {ICML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {5926--5936},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {http://proceedings.mlr.press/v97/song19d.html},
  timestamp = {Fri, 04 Dec 2020 15:21:06 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/SongTQLL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/SuadaaKFOT20,
  author    = {Lya Hulliyyatus Suadaa and
               Hidetaka Kamigaito and
               Kotaro Funakoshi and
               Manabu Okumura and
               Hiroya Takamura},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {Towards Table-to-Text Generation with Numerical Reasoning},
  booktitle = {ACL},
  pages     = {1451--1465},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.115},
  doi       = {10.18653/v1/2021.acl-long.115},
  timestamp = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/SuadaaKFOT20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@article{DBLP:journals/corr/abs-2107-02137,
  author    = {Yu Sun and
               Shuohuan Wang and
               Shikun Feng and
               Siyu Ding and
               Chao Pang and
               Junyuan Shang and
               Jiaxiang Liu and
               Xuyi Chen and
               Yanbin Zhao and
               Yuxiang Lu and
               Weixin Liu and
               Zhihua Wu and
               Weibao Gong and
               Jianzhong Liang and
               Zhizhou Shang and
               Peng Sun and
               Wei Liu and
               Xuan Ouyang and
               Dianhai Yu and
               Hao Tian and
               Hua Wu and
               Haifeng Wang},
  title     = {{ERNIE} 3.0: Large-scale Knowledge Enhanced Pre-training for Language
               Understanding and Generation},
  journal   = {CoRR},
  volume    = {abs/2107.02137},
  year      = {2021},
  url       = {https://arxiv.org/abs/2107.02137},
  eprinttype = {arXiv},
  eprint    = {2107.02137},
  timestamp = {Tue, 15 Mar 2022 17:41:07 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2107-02137.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Knowledge Enhanced}
}

@inproceedings{DBLP:conf/naacl/TanYAXH21,
  author    = {Bowen Tan and
               Zichao Yang and
               Maruan Al{-}Shedivat and
               Eric P. Xing and
               Zhiting Hu},
  editor    = {Kristina Toutanova and
               Anna Rumshisky and
               Luke Zettlemoyer and
               Dilek Hakkani{-}T{\"{u}}r and
               Iz Beltagy and
               Steven Bethard and
               Ryan Cotterell and
               Tanmoy Chakraborty and
               Yichao Zhou},
  title     = {Progressive Generation of Long Text with Pretrained Language Models},
  booktitle = {NAACL},
  pages     = {4313--4324},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.naacl-main.341},
  doi       = {10.18653/v1/2021.naacl-main.341},
  timestamp = {Fri, 06 Aug 2021 00:41:32 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/TanYAXH21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/WangPPCWL20,
  author    = {Boxin Wang and
               Hengzhi Pei and
               Boyuan Pan and
               Qian Chen and
               Shuohang Wang and
               Bo Li},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {{T3:} Tree-Autoencoder Constrained Adversarial Text Generation for
               Targeted Attack},
  booktitle = {EMNLP},
  pages     = {6134--6150},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.495},
  doi       = {10.18653/v1/2020.emnlp-main.495},
  timestamp = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/WangPPCWL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}
@inproceedings{DBLP:conf/ecir/WangLZ21,
  author    = {Wei Wang and
               Piji Li and
               Hai{-}Tao Zheng},
  editor    = {Djoerd Hiemstra and
               Marie{-}Francine Moens and
               Josiane Mothe and
               Raffaele Perego and
               Martin Potthast and
               Fabrizio Sebastiani},
  title     = {Consistency and Coherency Enhanced Story Generation},
  booktitle = {ECIR},
  series    = {Lecture Notes in Computer Science},
  volume    = {12656},
  pages     = {694--709},
  publisher = {Springer},
  year      = {2021},
  url       = {https://doi.org/10.1007/978-3-030-72113-8\_46},
  doi       = {10.1007/978-3-030-72113-8\_46},
  timestamp = {Tue, 30 Mar 2021 18:55:01 +0200},
  biburl    = {https://dblp.org/rec/conf/ecir/WangLZ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/XingW21,
  author    = {Xinyu Xing and
               Xiaojun Wan},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {Structure-Aware Pre-Training for Table-to-Text Generation},
  booktitle = {ACL Findings},
  series    = {Findings of {ACL}},
  volume    = {{ACL/IJCNLP} 2021},
  pages     = {2273--2278},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.200},
  doi       = {10.18653/v1/2021.findings-acl.200},
  timestamp = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/XingW21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/XuPSPFAC20,
  author    = {Peng Xu and
               Mostofa Patwary and
               Mohammad Shoeybi and
               Raul Puri and
               Pascale Fung and
               Anima Anandkumar and
               Bryan Catanzaro},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {{MEGATRON-CNTRL:} Controllable Story Generation with External Knowledge
               Using Large-Scale Language Models},
  booktitle = {EMNLP},
  pages     = {2831--2845},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.226},
  doi       = {10.18653/v1/2020.emnlp-main.226},
  timestamp = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/XuPSPFAC20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Knowledge Enhanced}
}

@inproceedings{DBLP:conf/acl/XuWKL20,
  author    = {Xinnuo Xu and
               Guoyin Wang and
               Young{-}Bum Kim and
               Sungjin Lee},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {{AugNLG}: Few-shot Natural Language Generation using Self-trained Data
               Augmentation},
  booktitle = {ACL},
  pages     = {1183--1195},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.95},
  doi       = {10.18653/v1/2021.acl-long.95},
  timestamp = {Mon, 03 Jan 2022 15:14:00 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/XuWKL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/XueSW0ZQZL20,
  author    = {Lanqing Xue and
               Kaitao Song and
               Duocai Wu and
               Xu Tan and
               Nevin L. Zhang and
               Tao Qin and
               Wei{-}Qiang Zhang and
               Tie{-}Yan Liu},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {{DeepRapper}: Neural Rap Generation with Rhyme and Rhythm Modeling},
  booktitle = {ACL},
  pages     = {69--81},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.6},
  doi       = {10.18653/v1/2021.acl-long.6},
  timestamp = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/XueSW0ZQZL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/YanHCBYGDCCZ21,
  author    = {Yu Yan and
               Fei Hu and
               Jiusheng Chen and
               Nikhil Bhendawade and
               Ting Ye and
               Yeyun Gong and
               Nan Duan and
               Desheng Cui and
               Bingyu Chi and
               Ruofei Zhang},
  editor    = {Heng Ji and
               Jong C. Park and
               Rui Xia},
  title     = {{FastSeq}: Make Sequence Generation Faster},
  booktitle = {ACL},
  pages     = {218--226},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-demo.26},
  doi       = {10.18653/v1/2021.acl-demo.26},
  timestamp = {Mon, 01 Aug 2022 16:27:43 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/YanHCBYGDCCZ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/emnlp/Yang0XLBWWL20,
  author    = {Ze Yang and
               Wei Wu and
               Can Xu and
               Xinnian Liang and
               Jiaqi Bai and
               Liran Wang and
               Wei Wang and
               Zhoujun Li},
  editor    = {Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {{StyleDGPT}: Stylized Response Generation with Pre-trained Language
               Models},
  booktitle = {EMNLP Findings},
  series    = {Findings of {ACL}},
  volume    = {{EMNLP} 2020},
  pages     = {1548--1559},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.findings-emnlp.140},
  doi       = {10.18653/v1/2020.findings-emnlp.140},
  timestamp = {Fri, 05 Aug 2022 08:38:44 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/Yang0XLBWWL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@article{DBLP:journals/corr/abs-2010-11140,
  author    = {Yan Zeng and
               Jian{-}Yun Nie},
  title     = {Generalized Conditioned Dialogue Generation Based on Pre-trained Language
               Model},
  journal   = {CoRR},
  volume    = {abs/2010.11140},
  year      = {2020},
  url       = {https://arxiv.org/abs/2010.11140},
  eprinttype = {arXiv},
  eprint    = {2010.11140},
  timestamp = {Fri, 06 Aug 2021 09:05:03 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2010-11140.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/naacl/ZengN21,
  author    = {Yan Zeng and
               Jian{-}Yun Nie},
  editor    = {Kristina Toutanova and
               Anna Rumshisky and
               Luke Zettlemoyer and
               Dilek Hakkani{-}T{\"{u}}r and
               Iz Beltagy and
               Steven Bethard and
               Ryan Cotterell and
               Tanmoy Chakraborty and
               Yichao Zhou},
  title     = {A Simple and Efficient Multi-Task Learning Approach for Conditioned
               Dialogue Generation},
  booktitle = {NAACL},
  pages     = {4927--4939},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.naacl-main.392},
  doi       = {10.18653/v1/2021.naacl-main.392},
  timestamp = {Fri, 06 Aug 2021 09:05:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/ZengN21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/iclr/ZhangKWWA20,
  author    = {Tianyi Zhang and
               Varsha Kishore and
               Felix Wu and
               Kilian Q. Weinberger and
               Yoav Artzi},
  title     = {{BERTScore}: Evaluating Text Generation with {BERT}},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2020},
  url       = {https://openreview.net/forum?id=SkeHuCVFDr},
  timestamp = {Wed, 03 Jun 2020 10:08:32 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/ZhangKWWA20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC, Evaluation}
}

@inproceedings{DBLP:conf/sigir/ZhangJSC0FXL21,
  author    = {Xueying Zhang and
               Yunjiang Jiang and
               Yue Shang and
               Zhaomeng Cheng and
               Chi Zhang and
               Xiaochuan Fan and
               Yun Xiao and
               Bo Long},
  editor    = {Fernando Diaz and
               Chirag Shah and
               Torsten Suel and
               Pablo Castells and
               Rosie Jones and
               Tetsuya Sakai},
  title     = {{DSGPT:} Domain-Specific Generative Pre-Training of Transformers for
               Text Generation in E-commerce Title and Review Summarization},
  booktitle = {SIGIR},
  pages     = {2146--2150},
  publisher = {{ACM}},
  year      = {2021},
  url       = {https://doi.org/10.1145/3404835.3463037},
  doi       = {10.1145/3404835.3463037},
  timestamp = {Thu, 15 Jul 2021 15:30:48 +0200},
  biburl    = {https://dblp.org/rec/conf/sigir/ZhangJSC0FXL21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}

@inproceedings{DBLP:conf/acl/ZhangSGCBGGLD20,
  author    = {Yizhe Zhang and
               Siqi Sun and
               Michel Galley and
               Yen{-}Chun Chen and
               Chris Brockett and
               Xiang Gao and
               Jianfeng Gao and
               Jingjing Liu and
               Bill Dolan},
  editor    = {Asli Celikyilmaz and
               Tsung{-}Hsien Wen},
  title     = {{DIALOGPT}: Large-Scale Generative Pre-training for Conversational
               Response Generation},
  booktitle = {ACL},
  pages     = {270--278},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.acl-demos.30},
  doi       = {10.18653/v1/2020.acl-demos.30},
  timestamp = {Fri, 06 Aug 2021 00:41:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/ZhangSGCBGGLD20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {AIGC}
}


% from MIN Denghai

@article{DBLP:journals/corr/HintonVD15,
  author    = {Geoffrey E. Hinton and
               Oriol Vinyals and
               Jeffrey Dean},
  title     = {Distilling the Knowledge in a Neural Network},
  journal   = {CoRR},
  volume    = {abs/1503.02531},
  year      = {2015},
  url       = {http://arxiv.org/abs/1503.02531},
  eprinttype = {arXiv},
  eprint    = {1503.02531},
  timestamp = {Mon, 13 Aug 2018 16:48:36 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/HintonVD15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/aaai/MirzadehFLLMG20,
  author    = {Seyed{-}Iman Mirzadeh and
               Mehrdad Farajtabar and
               Ang Li and
               Nir Levine and
               Akihiro Matsukawa and
               Hassan Ghasemzadeh},
  title     = {Improved Knowledge Distillation via Teacher Assistant},
  booktitle = {AAAI},
  pages     = {5191--5198},
  publisher = {{AAAI} Press},
  year      = {2020},
  url       = {https://ojs.aaai.org/index.php/AAAI/article/view/5963},
  timestamp = {Mon, 07 Mar 2022 16:57:42 +0100},
  biburl    = {https://dblp.org/rec/conf/aaai/MirzadehFLLMG20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/cvpr/ParkKLC19,
  author    = {Wonpyo Park and
               Dongju Kim and
               Yan Lu and
               Minsu Cho},
  title     = {Relational Knowledge Distillation},
  booktitle = {CVPR},
  pages     = {3967--3976},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2019},
  url       = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Park\_Relational\_Knowledge\_Distillation\_CVPR\_2019\_paper.html},
  doi       = {10.1109/CVPR.2019.00409},
  timestamp = {Mon, 30 Aug 2021 17:01:14 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/ParkKLC19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/corr/SauB16,
  author    = {Bharat Bhusan Sau and
               Vineeth N. Balasubramanian},
  title     = {Deep Model Compression: Distilling Knowledge from Noisy Teachers},
  journal   = {CoRR},
  volume    = {abs/1610.09650},
  year      = {2016},
  url       = {http://arxiv.org/abs/1610.09650},
  eprinttype = {arXiv},
  eprint    = {1610.09650},
  timestamp = {Mon, 13 Aug 2018 16:48:05 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/SauB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/iclr/ZagoruykoK17,
  author    = {Sergey Zagoruyko and
               Nikos Komodakis},
  title     = {Paying More Attention to Attention: Improving the Performance of Convolutional
               Neural Networks via Attention Transfer},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2017},
  url       = {https://openreview.net/forum?id=Sks9\_ajex},
  timestamp = {Thu, 25 Jul 2019 14:25:41 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/ZagoruykoK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/corr/abs-1909-11723,
  author    = {Li Yuan and
               Francis E. H. Tay and
               Guilin Li and
               Tao Wang and
               Jiashi Feng},
  title     = {Revisit Knowledge Distillation: a Teacher-free Framework},
  journal   = {CoRR},
  volume    = {abs/1909.11723},
  year      = {2019},
  url       = {http://arxiv.org/abs/1909.11723},
  eprinttype = {arXiv},
  eprint    = {1909.11723},
  timestamp = {Thu, 19 Nov 2020 20:36:33 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-1909-11723.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/iclr/TarvainenV17,
  author    = {Antti Tarvainen and
               Harri Valpola},
  title     = {Mean teachers are better role models: Weight-averaged consistency
               targets improve semi-supervised deep learning results},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2017},
  url       = {https://openreview.net/forum?id=ry8u21rtl},
  timestamp = {Thu, 04 Apr 2019 13:20:08 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/TarvainenV17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/iccv/JinPWLLLYH19,
  author    = {Xiao Jin and
               Baoyun Peng and
               Yichao Wu and
               Yu Liu and
               Jiaheng Liu and
               Ding Liang and
               Junjie Yan and
               Xiaolin Hu},
  title     = {Knowledge Distillation via Route Constrained Optimization},
  booktitle = {ICCV},
  pages     = {1345--1354},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/ICCV.2019.00143},
  doi       = {10.1109/ICCV.2019.00143},
  timestamp = {Mon, 16 Mar 2020 17:55:53 +0100},
  biburl    = {https://dblp.org/rec/conf/iccv/JinPWLLLYH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/icml/FurlanelloLTIA18,
  author    = {Tommaso Furlanello and
               Zachary Chase Lipton and
               Michael Tschannen and
               Laurent Itti and
               Anima Anandkumar},
  editor    = {Jennifer G. Dy and
               Andreas Krause},
  title     = {Born-Again Neural Networks},
  booktitle = {ICML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {80},
  pages     = {1602--1611},
  publisher = {{PMLR}},
  year      = {2018},
  url       = {http://proceedings.mlr.press/v80/furlanello18a.html},
  timestamp = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/FurlanelloLTIA18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/ijon/WenLQ21,
  author    = {Tiancheng Wen and
               Shenqi Lai and
               Xueming Qian},
  title     = {Preparing lessons: Improve knowledge distillation with better supervision},
  journal   = {Neurocomputing},
  volume    = {454},
  pages     = {25--33},
  year      = {2021},
  url       = {https://doi.org/10.1016/j.neucom.2021.04.102},
  doi       = {10.1016/j.neucom.2021.04.102},
  timestamp = {Tue, 16 Aug 2022 23:06:48 +0200},
  biburl    = {https://dblp.org/rec/journals/ijon/WenLQ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/corr/abs-1910-05057,
  author    = {Elahe Arani and
               Fahad Sarfraz and
               Bahram Zonooz},
  title     = {Improving Generalization and Robustness with Noisy Collaboration in
               Knowledge Distillation},
  journal   = {CoRR},
  volume    = {abs/1910.05057},
  year      = {2019},
  url       = {http://arxiv.org/abs/1910.05057},
  eprinttype = {arXiv},
  eprint    = {1910.05057},
  timestamp = {Wed, 16 Oct 2019 16:25:53 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-1910-05057.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/corr/abs-1903-12136,
  author    = {Raphael Tang and
               Yao Lu and
               Linqing Liu and
               Lili Mou and
               Olga Vechtomova and
               Jimmy Lin},
  title     = {Distilling Task-Specific Knowledge from {BERT} into Simple Neural
               Networks},
  journal   = {CoRR},
  volume    = {abs/1903.12136},
  year      = {2019},
  url       = {http://arxiv.org/abs/1903.12136},
  eprinttype = {arXiv},
  eprint    = {1903.12136},
  timestamp = {Tue, 02 Apr 2019 11:16:55 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-1903-12136.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@article{DBLP:journals/corr/ZhangXHL17,
  author    = {Ying Zhang and
               Tao Xiang and
               Timothy M. Hospedales and
               Huchuan Lu},
  title     = {Deep Mutual Learning},
  journal   = {CoRR},
  volume    = {abs/1706.00384},
  year      = {2017},
  url       = {http://arxiv.org/abs/1706.00384},
  eprinttype = {arXiv},
  eprint    = {1706.00384},
  timestamp = {Wed, 09 Jan 2019 14:59:45 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/ZhangXHL17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/iclr/FrankleC19,
  author    = {Jonathan Frankle and
               Michael Carbin},
  title     = {The Lottery Ticket Hypothesis: Finding Sparse, Trainable Neural Networks},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2019},
  url       = {https://openreview.net/forum?id=rJl-b3RcF7},
  timestamp = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/FrankleC19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}

@inproceedings{DBLP:conf/cvpr/YunPLS20,
  author    = {Sukmin Yun and
               Jongjin Park and
               Kimin Lee and
               Jinwoo Shin},
  title     = {Regularizing Class-Wise Predictions via Self-Knowledge Distillation},
  booktitle = {CVPR},
  pages     = {13873--13882},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2020},
  url       = {https://openaccess.thecvf.com/content_CVPR_2020/papers/Yun_Regularizing_Class-Wise_Predictions_via_Self-Knowledge_Distillation_CVPR_2020_paper.pdf},
  doi       = {10.1109/CVPR42600.2020.01389},
  timestamp = {Tue, 31 Aug 2021 14:00:04 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/YunPLS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation},
  code      = {https://github.com/SforAiDl/KD_Lib}
}


// 0214


@article{DBLP:journals/corr/abs-2301-00774,
  author    = {Elias Frantar and
               Dan Alistarh},
  title     = {{SparseGPT}: Massive Language Models Can Be Accurately Pruned in One-Shot},
  journal   = {CoRR},
  volume    = {abs/2301.00774},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2301.00774},
  doi       = {10.48550/arXiv.2301.00774},
  eprinttype = {arXiv},
  eprint    = {2301.00774},
  timestamp = {Thu, 19 Jan 2023 07:41:01 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-00774.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}


// from DAI Xinbang

@incollection{DBLP:series/lncs/LyuXWY20,
  author    = {Lingjuan Lyu and
               Xinyi Xu and
               Qian Wang and
               Han Yu},
  editor    = {Qiang Yang and
               Lixin Fan and
               Han Yu},
  title     = {Collaborative Fairness in Federated Learning},
  booktitle = {FLPI},
  series    = {Lecture Notes in Computer Science},
  volume    = {12500},
  pages     = {189--204},
  publisher = {Springer},
  year      = {2020},
  url       = {https://doi.org/10.1007/978-3-030-63076-8\_14},
  doi       = {10.1007/978-3-030-63076-8\_14},
  timestamp = {Tue, 19 Apr 2022 16:03:59 +0200},
  biburl    = {https://dblp.org/rec/series/lncs/LyuXWY20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/icml/00050BS21,
  author    = {Tian Li and
               Shengyuan Hu and
               Ahmad Beirami and
               Virginia Smith},
  editor    = {Marina Meila and
               Tong Zhang},
  title     = {Ditto: Fair and Robust Federated Learning Through Personalization},
  booktitle = {ICML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {139},
  pages     = {6357--6368},
  publisher = {{PMLR}},
  year      = {2021},
  url       = {http://proceedings.mlr.press/v139/li21h.html},
  timestamp = {Wed, 25 Aug 2021 17:11:17 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/00050BS21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/isci/HuangLWDZH22,
  author    = {Wei Huang and
               Tianrui Li and
               Dexian Wang and
               Shengdong Du and
               Junbo Zhang and
               Tianqiang Huang},
  title     = {Fairness and accuracy in horizontal federated learning},
  journal   = {Information Sciences},
  volume    = {589},
  pages     = {170--185},
  year      = {2022},
  url       = {https://doi.org/10.1016/j.ins.2021.12.102},
  doi       = {10.1016/j.ins.2021.12.102},
  timestamp = {Fri, 18 Feb 2022 10:36:34 +0100},
  biburl    = {https://dblp.org/rec/journals/isci/HuangLWDZH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/corr/abs-2108-07313,
  author    = {Gary Cheng and
               Karan N. Chadha and
               John C. Duchi},
  title     = {Fine-tuning is Fine in Federated Learning},
  journal   = {CoRR},
  volume    = {abs/2108.07313},
  year      = {2021},
  url       = {https://arxiv.org/abs/2108.07313},
  eprinttype = {arXiv},
  eprint    = {2108.07313},
  timestamp = {Fri, 20 Aug 2021 13:55:54 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2108-07313.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/tnse/HuSZY22,
  author    = {Zeou Hu and
               Kiarash Shaloudegi and
               Guojun Zhang and
               Yaoliang Yu},
  title     = {Federated Learning Meets Multi-Objective Optimization},
  journal   = {TNSE},
  volume    = {9},
  number    = {4},
  pages     = {2039--2051},
  year      = {2022},
  url       = {https://doi.org/10.1109/TNSE.2022.3169117},
  doi       = {10.1109/TNSE.2022.3169117},
  timestamp = {Mon, 25 Jul 2022 08:40:16 +0200},
  biburl    = {https://dblp.org/rec/journals/tnse/HuSZY22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/ijcai/WangF0WWY21,
  author    = {Zheng Wang and
               Xiaoliang Fan and
               Jianzhong Qi and
               Chenglu Wen and
               Cheng Wang and
               Rongshan Yu},
  editor    = {Zhi{-}Hua Zhou},
  title     = {Federated Learning with Fair Averaging},
  booktitle = {IJCAI},
  pages     = {1615--1623},
  publisher = {ijcai.org},
  year      = {2021},
  url       = {https://doi.org/10.24963/ijcai.2021/223},
  doi       = {10.24963/ijcai.2021/223},
  timestamp = {Sat, 04 Sep 2021 14:47:47 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/WangF0WWY21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/eccv/HsuQ020,
  author    = {Tzu{-}Ming Harry Hsu and
               Hang Qi and
               Matthew Brown},
  editor    = {Andrea Vedaldi and
               Horst Bischof and
               Thomas Brox and
               Jan{-}Michael Frahm},
  title     = {Federated Visual Classification with Real-World Data Distribution},
  booktitle = {ECCV},
  series    = {Lecture Notes in Computer Science},
  volume    = {12355},
  pages     = {76--92},
  publisher = {Springer},
  year      = {2020},
  url       = {https://doi.org/10.1007/978-3-030-58607-2\_5},
  doi       = {10.1007/978-3-030-58607-2\_5},
  timestamp = {Tue, 10 Nov 2020 14:04:43 +0100},
  biburl    = {https://dblp.org/rec/conf/eccv/HsuQ020.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/kais/LiuHZLJXD22,
  author    = {Ji Liu and
               Jizhou Huang and
               Yang Zhou and
               Xuhong Li and
               Shilei Ji and
               Haoyi Xiong and
               Dejing Dou},
  title     = {From distributed machine learning to federated learning: a survey},
  journal   = {KAIS},
  volume    = {64},
  number    = {4},
  pages     = {885--917},
  year      = {2022},
  url       = {https://doi.org/10.1007/s10115-022-01664-x},
  doi       = {10.1007/s10115-022-01664-x},
  timestamp = {Thu, 23 Jun 2022 20:05:07 +0200},
  biburl    = {https://dblp.org/rec/journals/kais/LiuHZLJXD22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning, Survey}
}

@inproceedings{DBLP:conf/ijcai/Chen0YCDHC22,
  author    = {Mingyang Chen and
               Wen Zhang and
               Zhen Yao and
               Xiangnan Chen and
               Mengxiao Ding and
               Fei Huang and
               Huajun Chen},
  editor    = {Luc De Raedt},
  title     = {Meta-Learning Based Knowledge Extrapolation for Knowledge Graphs in
               the Federated Setting},
  booktitle = {IJCAI},
  pages     = {1966--1972},
  publisher = {ijcai.org},
  year      = {2022},
  url       = {https://doi.org/10.24963/ijcai.2022/273},
  doi       = {10.24963/ijcai.2022/273},
  timestamp = {Wed, 27 Jul 2022 16:43:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/Chen0YCDHC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/cikm/ChuHTCDLB22,
  author    = {Yun{-}Wei Chu and
               Seyyedali Hosseinalipour and
               Elizabeth Tenorio and
               Laura M. Cruz Castro and
               Kerrie A. Douglas and
               Andrew Lan and
               Christopher G. Brinton},
  editor    = {Mohammad Al Hasan and
               Li Xiong},
  title     = {Mitigating Biases in Student Performance Prediction via Attention-Based
               Personalized Federated Learning},
  booktitle = {CIKM},
  pages     = {3033--3042},
  publisher = {{ACM}},
  year      = {2022},
  url       = {https://doi.org/10.1145/3511808.3557108},
  doi       = {10.1145/3511808.3557108},
  timestamp = {Wed, 19 Oct 2022 17:09:02 +0200},
  biburl    = {https://dblp.org/rec/conf/cikm/ChuHTCDLB22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/naacl/WellerMBLD22,
  author    = {Orion Weller and
               Marc Marone and
               Vladimir Braverman and
               Dawn J. Lawrie and
               Benjamin Van Durme},
  editor    = {Marine Carpuat and
               Marie{-}Catherine de Marneffe and
               Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title     = {Pretrained Models for Multilingual Federated Learning},
  booktitle = {NAACL},
  pages     = {1413--1421},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.101},
  doi       = {10.18653/v1/2022.naacl-main.101},
  timestamp = {Mon, 01 Aug 2022 16:28:01 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/WellerMBLD22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/cvpr/QuZLXW00R22,
  author    = {Liangqiong Qu and
               Yuyin Zhou and
               Paul Pu Liang and
               Yingda Xia and
               Feifei Wang and
               Ehsan Adeli and
               Li Fei{-}Fei and
               Daniel L. Rubin},
  title     = {Rethinking Architecture Design for Tackling Data Heterogeneity in
               Federated Learning},
  booktitle = {CVPR},
  pages     = {10051--10061},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/CVPR52688.2022.00982},
  doi       = {10.1109/CVPR52688.2022.00982},
  timestamp = {Wed, 05 Oct 2022 16:31:19 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/QuZLXW00R22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/tist/TianWLYJS22,
  author    = {Yuanyishu Tian and
               Yao Wan and
               Lingjuan Lyu and
               Dezhong Yao and
               Hai Jin and
               Lichao Sun},
  title     = {{FedBERT}: When Federated Learning Meets Pre-training},
  journal   = {TIST},
  volume    = {13},
  number    = {4},
  pages     = {66:1--66:26},
  year      = {2022},
  url       = {https://doi.org/10.1145/3510033},
  doi       = {10.1145/3510033},
  timestamp = {Tue, 13 Dec 2022 09:59:50 +0100},
  biburl    = {https://dblp.org/rec/journals/tist/TianWLYJS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@article{DBLP:journals/corr/abs-2210-08090,
  author    = {John Nguyen and
               Jianyu Wang and
               Kshitiz Malik and
               Maziar Sanjabi and
               Michael Rabbat},
  title     = {Where to Begin? On the Impact of Pre-Training and Initialization in
               Federated Learning},
  journal   = {CoRR},
  volume    = {abs/2210.08090},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.08090},
  doi       = {10.48550/arXiv.2210.08090},
  eprinttype = {arXiv},
  eprint    = {2210.08090},
  timestamp = {Tue, 18 Oct 2022 15:06:52 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-08090.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Federated Learning}
}

@inproceedings{DBLP:conf/sc/Zheng0WZSSGZK20,
  author    = {Da Zheng and
               Chao Ma and
               Minjie Wang and
               Jinjing Zhou and
               Qidong Su and
               Xiang Song and
               Quan Gan and
               Zheng Zhang and
               George Karypis},
  title     = {{DistDGL}: Distributed Graph Neural Network Training for Billion-Scale
               Graphs},
  booktitle = {IA3},
  pages     = {36--44},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/IA351965.2020.00011},
  doi       = {10.1109/IA351965.2020.00011},
  timestamp = {Tue, 10 Aug 2021 16:44:53 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/Zheng0WZSSGZK20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@inproceedings{DBLP:conf/edbt/Sheikh0GR22,
  author    = {Nasrullah Sheikh and
               Xiao Qin and
               Yaniv Gur and
               Berthold Reinwald},
  editor    = {Julia Stoyanovich and
               Jens Teubner and
               Paolo Guagliardo and
               Milos Nikolic and
               Andreas Pieris and
               Jan M{\"{u}}hlig and
               Fatma {\"{O}}zcan and
               Sebastian Schelter and
               H. V. Jagadish and
               Meihui Zhang},
  title     = {Distributed Training of Knowledge Graph Embedding Models using Ray},
  booktitle = {EDBT},
  pages     = {2:549--2:553},
  publisher = {OpenProceedings.org},
  year      = {2022},
  url       = {https://doi.org/10.48786/edbt.2022.48},
  doi       = {10.48786/edbt.2022.48},
  timestamp = {Tue, 11 Oct 2022 14:23:40 +0200},
  biburl    = {https://dblp.org/rec/conf/edbt/Sheikh0GR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@article{DBLP:journals/jstsp/ChenBTS22,
  author    = {Yicheng Chen and
               Rick S. Blum and
               Martin Tak{\'{a}}c and
               Brian M. Sadler},
  title     = {Distributed Learning With Sparsified Gradient Differences},
  journal   = {JSTSP},
  volume    = {16},
  number    = {3},
  pages     = {585--600},
  year      = {2022},
  url       = {https://doi.org/10.1109/JSTSP.2022.3162989},
  doi       = {10.1109/JSTSP.2022.3162989},
  timestamp = {Wed, 11 Jan 2023 07:38:17 +0100},
  biburl    = {https://dblp.org/rec/journals/jstsp/ChenBTS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@inproceedings{DBLP:conf/europar/DongLWGQLYVD21,
  author    = {Daxiang Dong and
               Ji Liu and
               Xi Wang and
               Weibao Gong and
               An Qin and
               Xingjian Li and
               Dianhai Yu and
               Patrick Valduriez and
               Dejing Dou},
  editor    = {Ricardo Chaves and
               Dora B. Heras and
               Aleksandar Ilic and
               Didem Unat and
               Rosa M. Badia and
               Andrea Bracciali and
               Patrick Diehl and
               Anshu Dubey and
               Oh Sangyoon and
               Stephen L. Scott and
               Laura Ricci},
  title     = {Elastic Deep Learning Using Knowledge Distillation with Heterogeneous
               Computing Resources},
  booktitle = {Euro-Par},
  series    = {Lecture Notes in Computer Science},
  volume    = {13098},
  pages     = {116--128},
  publisher = {Springer},
  year      = {2021},
  url       = {https://doi.org/10.1007/978-3-031-06156-1\_10},
  doi       = {10.1007/978-3-031-06156-1\_10},
  timestamp = {Tue, 14 Feb 2023 22:22:15 +0100},
  biburl    = {https://dblp.org/rec/conf/europar/DongLWGQLYVD21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@inproceedings{DBLP:conf/icdcs/XuHADBKCK21,
  author    = {Hang Xu and
               Chen{-}Yu Ho and
               Ahmed M. Abdelmoniem and
               Aritra Dutta and
               El Houcine Bergou and
               Konstantinos Karatsenidis and
               Marco Canini and
               Panos Kalnis},
  title     = {{GRACE:} {A} Compressed Communication Framework for Distributed Machine
               Learning},
  booktitle = {ICDCS},
  pages     = {561--572},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ICDCS51616.2021.00060},
  doi       = {10.1109/ICDCS51616.2021.00060},
  timestamp = {Mon, 03 Jan 2022 22:38:16 +0100},
  biburl    = {https://dblp.org/rec/conf/icdcs/XuHADBKCK21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@inproceedings{9817156,
  author    = {Esmaeilzadeh, Armin and Zadeh Nojoo Kambar, Mina Esmail and Heidari, Maryam},
  title     = {Graph Attention Neural Network Distributed Model Training},
  booktitle = {AIIoT},
  pages     = {447--452},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://ieeexplore.ieee.org/document/9817156},
  doi       = {10.1109/AIIoT54504.2022.9817156},
  keywords  = {Distributed AI}
}

@inproceedings{DBLP:conf/icpads/MaLCW21,
  author    = {Delu Ma and
               Zhou Lei and
               Shengbo Chen and
               Peng Wang},
  title     = {Load Balancing Optimization for Transformer in Distributed Environment},
  booktitle = {ICPADS},
  pages     = {827--834},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ICPADS53394.2021.00109},
  doi       = {10.1109/ICPADS53394.2021.00109},
  timestamp = {Mon, 09 May 2022 09:35:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icpads/MaLCW21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@article{DBLP:journals/pvldb/LiZVSNLPSVDC20,
  author    = {Shen Li and
               Yanli Zhao and
               Rohan Varma and
               Omkar Salpekar and
               Pieter Noordhuis and
               Teng Li and
               Adam Paszke and
               Jeff Smith and
               Brian Vaughan and
               Pritam Damania and
               Soumith Chintala},
  title     = {{PyTorch} Distributed: Experiences on Accelerating Data Parallel Training},
  journal   = {PVLDB},
  volume    = {13},
  number    = {12},
  pages     = {3005--3018},
  year      = {2020},
  url       = {http://www.vldb.org/pvldb/vol13/p3005-li.pdf},
  doi       = {10.14778/3415478.3415530},
  timestamp = {Wed, 16 Mar 2022 23:53:41 +0100},
  biburl    = {https://dblp.org/rec/journals/pvldb/LiZVSNLPSVDC20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}

@inproceedings{DBLP:conf/osdi/MoritzNWTLLEYPJ18,
  author    = {Philipp Moritz and
               Robert Nishihara and
               Stephanie Wang and
               Alexey Tumanov and
               Richard Liaw and
               Eric Liang and
               Melih Elibol and
               Zongheng Yang and
               William Paul and
               Michael I. Jordan and
               Ion Stoica},
  editor    = {Andrea C. Arpaci{-}Dusseau and
               Geoff Voelker},
  title     = {Ray: {A} Distributed Framework for Emerging {AI} Applications},
  booktitle = {OSDI},
  pages     = {561--577},
  publisher = {{USENIX} Association},
  year      = {2018},
  url       = {https://www.usenix.org/conference/osdi18/presentation/nishihara},
  timestamp = {Tue, 02 Feb 2021 08:06:02 +0100},
  biburl    = {https://dblp.org/rec/conf/osdi/MoritzNWTLLEYPJ18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Distributed AI}
}


// from CHEN Zizhuo

@inproceedings{DBLP:conf/issta/ZengTZLZZ22,
  author    = {Zhengran Zeng and
               Hanzhuo Tan and
               Haotian Zhang and
               Jing Li and
               Yuqun Zhang and
               Lingming Zhang},
  editor    = {Sukyoung Ryu and
               Yannis Smaragdakis},
  title     = {An extensive study on pre-trained models for program understanding
               and generation},
  booktitle = {ISSTA},
  pages     = {39--51},
  publisher = {{ACM}},
  year      = {2022},
  url       = {https://doi.org/10.1145/3533767.3534390},
  doi       = {10.1145/3533767.3534390},
  timestamp = {Tue, 26 Jul 2022 16:38:30 +0200},
  biburl    = {https://dblp.org/rec/conf/issta/ZengTZLZZ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Program and Code Generation}
}

@article{DBLP:journals/corr/abs-2207-01780,
  author    = {Hung Le and
               Yue Wang and
               Akhilesh Deepak Gotmare and
               Silvio Savarese and
               Steven C. H. Hoi},
  title     = {{CodeRL}: Mastering Code Generation through Pretrained Models and Deep
               Reinforcement Learning},
  journal   = {CoRR},
  volume    = {abs/2207.01780},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2207.01780},
  doi       = {10.48550/arXiv.2207.01780},
  eprinttype = {arXiv},
  eprint    = {2207.01780},
  timestamp = {Wed, 06 Jul 2022 15:50:43 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2207-01780.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Program and Code Generation}
}

@misc{wangcodet5mix,
  author       = {Wang, Yue and Le, Hung and Gotmare, Akhilesh Deepak and Li, Junnan and Hoi, Steven},
  title        = {{CodeT5Mix}: A Pretrained Mixture of Encoder-decoder Transformers for Code Understanding and Generation},
  howpublished = {OpenReview},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=VPCi3STZcaO},
  keywords     = {Program and Code Generation}
}

@inproceedings{DBLP:conf/emnlp/0034WJH21,
  author    = {Yue Wang and
               Weishi Wang and
               Shafiq R. Joty and
               Steven C. H. Hoi},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {{CodeT5}: Identifier-aware Unified Pre-trained Encoder-Decoder Models
               for Code Understanding and Generation},
  booktitle = {EMNLP},
  pages     = {8696--8708},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.685},
  doi       = {10.18653/v1/2021.emnlp-main.685},
  timestamp = {Thu, 20 Jan 2022 10:02:24 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/0034WJH21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Program and Code Generation}
}

@article{zhou2023codebertscore,
  author    = {Zhou, Shuyan and Alon, Uri and Agarwal, Sumit and Neubig, Graham},
  title     = {{CodeBERTScore}: Evaluating Code Generation with Pretrained Models of Code},
  journal   = {CoRR},
  volume    = {abs/2302.05527},
  year      = {2023},
  url       = {https://arxiv.org/abs/2302.05527},
  eprinttype = {arXiv},
  eprint    = {2302.05527},
  keywords  = {Program and Code Generation}
}

@inproceedings{DBLP:conf/nips/LuGRHSBCDJTLZSZ21,
  author    = {Shuai Lu and
               Daya Guo and
               Shuo Ren and
               Junjie Huang and
               Alexey Svyatkovskiy and
               Ambrosio Blanco and
               Colin B. Clement and
               Dawn Drain and
               Daxin Jiang and
               Duyu Tang and
               Ge Li and
               Lidong Zhou and
               Linjun Shou and
               Long Zhou and
               Michele Tufano and
               Ming Gong and
               Ming Zhou and
               Nan Duan and
               Neel Sundaresan and
               Shao Kun Deng and
               Shengyu Fu and
               Shujie Liu},
  editor    = {Joaquin Vanschoren and
               Sai{-}Kit Yeung},
  title     = {{CodeXGLUE}: {A} Machine Learning Benchmark Dataset for Code Understanding
               and Generation},
  booktitle = {NeurIPS},
  year      = {2021},
  url       = {https://datasets-benchmarks-proceedings.neurips.cc/paper/2021/hash/c16a5320fa475530d9583c34fd356ef5-Abstract-round1.html},
  timestamp = {Wed, 06 Jul 2022 08:37:30 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/LuGRHSBCDJTLZSZ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Program and Code Generation}
}

@inproceedings{DBLP:conf/sigsoft/SvyatkovskiyDFS20,
  author     = {Alexey Svyatkovskiy and Shao Kun Deng and Shengyu Fu and
                Neel Sundaresan},
  editor     = {Prem Devanbu and Myra B. Cohen and Thomas Zimmermann},
  title      = {IntelliCode compose: Code Generation using transformer},
  booktitle  = {FSE},
  pages      = {1433--1443},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3368089.3417058},
  doi        = {10.1145/3368089.3417058},
  timestamp  = {Tue, 10 Nov 2020 10:58:23 +0100},
  biburl     = {https://dblp.org/rec/conf/sigsoft/SvyatkovskiyDFS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/naacl/AhmadCRC21,
  author     = {Wasi Uddin Ahmad and Saikat Chakraborty and Baishakhi Ray and
                Kai{-}Wei Chang},
  editor     = {Kristina Toutanova and Anna Rumshisky and Luke Zettlemoyer and
                Dilek Hakkani{-}T{\"{u}}r and Iz Beltagy and Steven Bethard and
                Ryan Cotterell and Tanmoy Chakraborty and Yichao Zhou},
  title      = {Unified Pre-training for Program Understanding and Generation},
  booktitle  = {NAACL},
  pages      = {2655--2668},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.naacl-main.211},
  doi        = {10.18653/v1/2021.naacl-main.211},
  timestamp  = {Fri, 06 Aug 2021 00:41:31 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/AhmadCRC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/naacl/WangWWWZLWL22,
  author     = {Xin Wang and Yasheng Wang and Yao Wan and Jiawei Wang and
                Pingyi Zhou and Li Li and Hao Wu and Jin Liu},
  editor     = {Marine Carpuat and Marie{-}Catherine de Marneffe and
                Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title      = {{CODE-MVP:} Learning to Represent Source Code from Multiple Views
                with Contrastive Pre-Training},
  booktitle  = {NAACL Findings},
  pages      = {1066--1077},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-naacl.80},
  doi        = {10.18653/v1/2022.findings-naacl.80},
  timestamp  = {Tue, 03 Jan 2023 13:58:27 +0100},
  biburl     = {https://dblp.org/rec/conf/naacl/WangWWWZLWL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Representation}
}

@inproceedings{DBLP:conf/iclr/GuoRLFT0ZDSFTDC21,
  author     = {Daya Guo and Shuo Ren and Shuai Lu and Zhangyin Feng and
                Duyu Tang and Shujie Liu and Long Zhou and Nan Duan and
                Alexey Svyatkovskiy and Shengyu Fu and Michele Tufano and
                Shao Kun Deng and Colin B. Clement and Dawn Drain and
                Neel Sundaresan and Jian Yin and Daxin Jiang and Ming Zhou},
  title      = {GraphCodeBERT: Pre-training Code Representations with Data Flow},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=jLoC4ez43PZ},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/GuoRLFT0ZDSFTDC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Representation}
}

@article{DBLP:journals/corr/abs-2108-04556,
  author     = {Xin Wang and Yasheng Wang and Pingyi Zhou and Fei Mi and
                Meng Xiao and Yadao Wang and Li Li and Xiao Liu and
                Hao Wu and Jin Liu and Xin Jiang},
  title      = {{CLSEBERT:} Contrastive Learning for Syntax Enhanced Code Pre-Trained Model},
  journal    = {CoRR},
  volume     = {abs/2108.04556},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.04556},
  eprinttype = {arXiv},
  eprint     = {2108.04556},
  timestamp  = {Sat, 21 Jan 2023 21:14:09 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-04556.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Representation, Multimodal}
}

@inproceedings{DBLP:conf/acl/GuoLDW0022,
  author     = {Daya Guo and Shuai Lu and Nan Duan and Yanlin Wang and
                Ming Zhou and Jian Yin},
  editor     = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio},
  title      = {UniXcoder: Unified Cross-Modal Pre-training for Code Representation},
  booktitle  = {ACL},
  pages      = {7212--7225},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.499},
  doi        = {10.18653/v1/2022.acl-long.499},
  timestamp  = {Mon, 01 Aug 2022 16:27:41 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/GuoLDW0022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Representation}
}

@inproceedings{DBLP:conf/msr/MashhadiH21,
  author     = {Ehsan Mashhadi and Hadi Hemmati},
  title      = {Applying CodeBERT for Automated Program Repair of Java Simple Bugs},
  booktitle  = {MSR},
  pages      = {505--509},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/MSR52588.2021.00063},
  doi        = {10.1109/MSR52588.2021.00063},
  timestamp  = {Fri, 02 Jul 2021 15:01:28 +0200},
  biburl     = {https://dblp.org/rec/conf/msr/MashhadiH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@article{matsumoto2021model,
  author     = {Matsumoto, Taku and Watanobe, Yutaka and Nakamura, Keita},
  title      = {A model with iterative trials for correcting logic errors in source code},
  journal    = {Applied Sciences},
  volume     = {11},
  number     = {11},
  pages      = {4755},
  publisher  = {MDPI},
  year       = {2021},
  url        = {https://www.mdpi.com/2076-3417/11/11/4755},
  keywords   = {Code Fixing}
}

@inproceedings{DBLP:conf/issta/YuanZHFHHY22,
  author     = {Wei Yuan and Quanjun Zhang and Tieke He and Chunrong Fang and
                Quoc Viet Hung Nguyen and Xiaodong Hao and Hongzhi Yin},
  editor     = {Sukyoung Ryu and Yannis Smaragdakis},
  title      = {{CIRCLE:} continual repair across programming languages},
  booktitle  = {ISSTA},
  pages      = {678--690},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3533767.3534219},
  doi        = {10.1145/3533767.3534219},
  timestamp  = {Sun, 02 Oct 2022 16:10:13 +0200},
  biburl     = {https://dblp.org/rec/conf/issta/YuanZHFHHY22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@article{DBLP:journals/corr/abs-2105-09352,
  author     = {Dawn Drain and Colin B. Clement and Guillermo Serrato and
                Neel Sundaresan},
  title      = {DeepDebug: Fixing Python Bugs Using Stack Traces, Backtranslation, and Code Skeletons},
  journal    = {CoRR},
  volume     = {abs/2105.09352},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.09352},
  eprinttype = {arXiv},
  eprint     = {2105.09352},
  timestamp  = {Mon, 31 May 2021 16:16:57 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-09352.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@inproceedings{DBLP:conf/emnlp/Bui0H22,
  author     = {Nghi Bui and Yue Wang and Steven C. H. Hoi},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {Detect-Localize-Repair: {A} Unified Framework for Learning to Debug
                with CodeT5},
  booktitle  = {EMNLP Findings},
  pages      = {812--823},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.57},
  doi        = {10.18653/v1/2022.findings-emnlp.57},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/Bui0H22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@inproceedings{DBLP:conf/wasa/JiangXWZ22,
  author     = {Xuxiang Jiang and Yinhao Xiao and Jun Wang and Wei Zhang},
  editor     = {Lei Wang and Michael Segal and Jenhui Chen and Tie Qiu},
  title      = {Multi-view Pre-trained Model for Code Vulnerability Identification},
  booktitle  = {WASA},
  series     = {Lecture Notes in Computer Science},
  volume     = {13473},
  pages      = {127--135},
  publisher  = {Springer},
  year       = {2022},
  url        = {https://doi.org/10.1007/978-3-031-19211-1\_11},
  doi        = {10.1007/978-3-031-19211-1\_11},
  timestamp  = {Fri, 18 Nov 2022 20:51:16 +0100},
  biburl     = {https://dblp.org/rec/conf/wasa/JiangXWZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@inproceedings{DBLP:conf/icse-apr/LajkoCV22,
  author     = {M{\'{a}}rk Lajk{\'{o}} and Viktor Csuvik and
                L{\'{a}}szl{\'{o}} Vid{\'{a}}cs},
  title      = {Towards JavaScript program repair with Generative Pre-trained Transformer
                {(GPT-2)}},
  booktitle  = {APR@ICSE},
  pages      = {61--68},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3524459.3527350},
  doi        = {10.1145/3524459.3527350},
  timestamp  = {Mon, 11 Jul 2022 12:33:41 +0200},
  biburl     = {https://dblp.org/rec/conf/icse-apr/LajkoCV22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Fixing}
}

@inproceedings{DBLP:conf/ijcai/NiuL0022,
  author     = {Changan Niu and Chuanyi Li and Bin Luo and Vincent Ng},
  editor     = {Luc De Raedt},
  title      = {Deep Learning Meets Software Engineering: {A} Survey on Pre-Trained Models of Source Code},
  booktitle  = {IJCAI},
  pages      = {5546--5555},
  publisher  = {ijcai.org},
  year       = {2022},
  url        = {https://doi.org/10.24963/ijcai.2022/775},
  doi        = {10.24963/ijcai.2022/775},
  timestamp  = {Wed, 27 Jul 2022 16:43:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/NiuL0022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Software Engineering, Survey}
}

@article{DBLP:journals/corr/abs-2211-10623,
  author     = {Yao Li and Tao Zhang and Xiapu Luo and Haipeng Cai and
                Sen Fang and Dawei Yuan},
  title      = {Do Pre-trained Language Models Indeed Understand Software Engineering Tasks?},
  journal    = {CoRR},
  volume     = {abs/2211.10623},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.10623},
  doi        = {10.48550/arXiv.2211.10623},
  eprinttype = {arXiv},
  eprint     = {2211.10623},
  timestamp  = {Mon, 28 Nov 2022 07:07:22 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-10623.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Software Engineering}
}

@article{DBLP:journals/corr/abs-2104-05861,
  author     = {Mohammad Abdul Hadi and Fatemeh H. Fard},
  title      = {Evaluating Pre-Trained Models for User Feedback Analysis in Software Engineering: {A} Study on Classification of App-Reviews},
  journal    = {CoRR},
  volume     = {abs/2104.05861},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.05861},
  eprinttype = {arXiv},
  eprint     = {2104.05861},
  timestamp  = {Mon, 19 Apr 2021 16:45:47 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-05861.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Software Engineering, Evaluation}
}

@inproceedings{zhang2020sentiment,
  author     = {Zhang, Ting and Xu, Bowen and Thung, Ferdian and Haryono, Stefanus Agus and Lo, David and Jiang, Lingxiao},
  title      = {Sentiment analysis for software engineering: How far can pre-trained transformer models go?},
  booktitle  = {ICSME},
  pages      = {70--80},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://ieeexplore.ieee.org/abstract/document/9240704/},
  keywords   = {Software Engineering}
}

@inproceedings{DBLP:conf/kbse/KarmakarR21,
  author     = {Anjan Karmakar and Romain Robbes},
  title      = {What do pre-trained code models know about code?},
  booktitle  = {ASE},
  pages      = {1332--1336},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ASE51524.2021.9678927},
  doi        = {10.1109/ASE51524.2021.9678927},
  timestamp  = {Mon, 24 Jan 2022 17:59:41 +0100},
  biburl     = {https://dblp.org/rec/conf/kbse/KarmakarR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Software Engineering}
}

@inproceedings{DBLP:conf/kbse/LiuLZJ20,
  author     = {Fang Liu and Ge Li and Yunfei Zhao and Zhi Jin},
  title      = {Multi-task Learning based Pre-trained Language Model for Code Completion},
  booktitle  = {ASE},
  pages      = {473--485},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3324884.3416591},
  doi        = {10.1145/3324884.3416591},
  timestamp  = {Fri, 12 Feb 2021 13:04:43 +0100},
  biburl     = {https://dblp.org/rec/conf/kbse/LiuLZJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/kbse/LopezWCS22,
  author     = {Jos{\'{e}} Antonio Hern{\'{a}}ndez L{\'{o}}pez and Martin Weyssow and
                Jes{\'{u}}s S{\'{a}}nchez Cuadrado and Houari A. Sahraoui},
  title      = {AST-Probe: Recovering abstract syntax trees from hidden representations of pre-trained language models},
  booktitle  = {ASE},
  pages      = {11:1--11:11},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3551349.3556900},
  doi        = {10.1145/3551349.3556900},
  timestamp  = {Wed, 18 Jan 2023 18:17:55 +0100},
  biburl     = {https://dblp.org/rec/conf/kbse/LopezWCS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Representation}
}

@inproceedings{DBLP:conf/kbse/ZhangP0LG22,
  author     = {Jiyang Zhang and Sheena Panthaplackel and Pengyu Nie and
                Junyi Jessy Li and Milos Gligoric},
  title      = {CoditT5: Pretraining for Source Code and Natural Language Editing},
  booktitle  = {ASE},
  pages      = {22:1--22:12},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3551349.3556955},
  doi        = {10.1145/3551349.3556955},
  timestamp  = {Sun, 15 Jan 2023 18:32:11 +0100},
  biburl     = {https://dblp.org/rec/conf/kbse/ZhangP0LG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/kbse/Shi0XK022,
  author     = {Jieke Shi and Zhou Yang and Bowen Xu and Hong Jin Kang and
                David Lo},
  title      = {Compressing Pre-trained Models of Code into 3 {MB}},
  booktitle  = {ASE},
  pages      = {24:1--24:12},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3551349.3556964},
  doi        = {10.1145/3551349.3556964},
  timestamp  = {Mon, 09 Jan 2023 10:38:12 +0100},
  biburl     = {https://dblp.org/rec/conf/kbse/Shi0XK022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation, Knowledge Distillation}
}

@inproceedings{DBLP:conf/sigsoft/LiYJYLHLZ22,
  author     = {Lingwei Li and Li Yang and Huaxi Jiang and Jun Yan and
                Tiejian Luo and Zihan Hua and Geng Liang and Chun Zuo},
  editor     = {Abhik Roychoudhury and Cristian Cadar and Miryung Kim},
  title      = {{AUGER:} automatically generating review comments with pre-training models},
  booktitle  = {FSE},
  pages      = {1009--1021},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3540250.3549099},
  doi        = {10.1145/3540250.3549099},
  timestamp  = {Thu, 10 Nov 2022 12:19:51 +0100},
  biburl     = {https://dblp.org/rec/conf/sigsoft/LiYJYLHLZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Review}
}

@inproceedings{DBLP:conf/sigsoft/LiLGDJJMGSFS22,
  author     = {Zhiyu Li and Shuai Lu and Daya Guo and Nan Duan and
                Shailesh Jannu and Grant Jenks and Deep Majumder and
                Jared Green and Alexey Svyatkovskiy and Shengyu Fu and
                Neel Sundaresan},
  editor     = {Abhik Roychoudhury and Cristian Cadar and Miryung Kim},
  title      = {Automating code review activities by large-scale pre-training},
  booktitle  = {FSE},
  pages      = {1035--1047},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3540250.3549081},
  doi        = {10.1145/3540250.3549081},
  timestamp  = {Thu, 10 Nov 2022 12:19:51 +0100},
  biburl     = {https://dblp.org/rec/conf/sigsoft/LiLGDJJMGSFS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Review}
}

@inproceedings{DBLP:conf/sigsoft/Zhang0S022,
  author     = {Zhaowei Zhang and Hongyu Zhang and Beijun Shen and Xiaodong Gu},
  editor     = {Abhik Roychoudhury and Cristian Cadar and Miryung Kim},
  title      = {Diet code is healthy: simplifying programs for pre-trained models of code},
  booktitle  = {FSE},
  pages      = {1073--1084},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3540250.3549094},
  doi        = {10.1145/3540250.3549094},
  timestamp  = {Thu, 10 Nov 2022 12:19:51 +0100},
  biburl     = {https://dblp.org/rec/conf/sigsoft/Zhang0S022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/sigsoft/ChakrabortyADDR22,
  author     = {Saikat Chakraborty and Toufique Ahmed and Yangruibo Ding and
                Premkumar T. Devanbu and Baishakhi Ray},
  editor     = {Abhik Roychoudhury and Cristian Cadar and Miryung Kim},
  title      = {NatGen: generative pre-training by ``naturalizing'' source code},
  booktitle  = {FSE},
  pages      = {18--30},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3540250.3549162},
  doi        = {10.1145/3540250.3549162},
  timestamp  = {Thu, 10 Nov 2022 12:19:51 +0100},
  biburl     = {https://dblp.org/rec/conf/sigsoft/ChakrabortyADDR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/icse/LinLZ0C21,
  author     = {Jinfeng Lin and Yalin Liu and Qingkai Zeng and Meng Jiang and
                Jane Cleland{-}Huang},
  title      = {Traceability Transformed: Generating more Accurate Links with Pre-Trained {BERT} Models},
  booktitle  = {ICSE},
  pages      = {324--335},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICSE43902.2021.00040},
  doi        = {10.1109/ICSE43902.2021.00040},
  timestamp  = {Mon, 19 Dec 2022 09:27:58 +0100},
  biburl     = {https://dblp.org/rec/conf/icse/LinLZ0C21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/icse/WangJLYX0L22,
  author     = {Deze Wang and Zhouyang Jia and Shanshan Li and Yue Yu and
                Yun Xiong and Wei Dong and Xiangke Liao},
  title      = {Bridging Pre-trained Models and Downstream Tasks for Source Code Understanding},
  booktitle  = {ICSE},
  pages      = {287--298},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3510003.3510062},
  doi        = {10.1145/3510003.3510062},
  timestamp  = {Thu, 02 Feb 2023 19:58:12 +0100},
  biburl     = {https://dblp.org/rec/conf/icse/WangJLYX0L22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Review}
}

@inproceedings{DBLP:conf/icse/JainVINPR022,
  author     = {Naman Jain and Skanda Vaidyanath and Arun Shankar Iyer and
                Nagarajan Natarajan and Suresh Parthasarathy and
                Sriram K. Rajamani and Rahul Sharma},
  title      = {Jigsaw: Large Language Models meet Program Synthesis},
  booktitle  = {ICSE},
  pages      = {1219--1231},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3510003.3510203},
  doi        = {10.1145/3510003.3510203},
  timestamp  = {Mon, 18 Jul 2022 16:47:42 +0200},
  biburl     = {https://dblp.org/rec/conf/icse/JainVINPR022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/icse/YangSH022,
  author     = {Zhou Yang and Jieke Shi and Junda He and David Lo},
  title      = {Natural Attack for Pre-trained Models of Code},
  booktitle  = {ICSE},
  pages      = {1482--1493},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3510003.3510146},
  doi        = {10.1145/3510003.3510146},
  timestamp  = {Sun, 12 Feb 2023 18:48:28 +0100},
  biburl     = {https://dblp.org/rec/conf/icse/YangSH022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@inproceedings{DBLP:conf/icse/TufanoMMPPB22,
  author     = {Rosalia Tufano and Simone Masiero and Antonio Mastropaolo and
                Luca Pascarella and Denys Poshyvanyk and Gabriele Bavota},
  title      = {Using Pre-Trained Models to Boost Code Review Automation},
  booktitle  = {ICSE},
  pages      = {2291--2302},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3510003.3510621},
  doi        = {10.1145/3510003.3510621},
  timestamp  = {Mon, 18 Jul 2022 16:47:42 +0200},
  biburl     = {https://dblp.org/rec/conf/icse/TufanoMMPPB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Review}
}

@inproceedings{DBLP:conf/icse/WanZZSXJ22,
  author     = {Yao Wan and Wei Zhao and Hongyu Zhang and Yulei Sui and
                Guandong Xu and Hai Jin},
  title      = {What Do They Capture? - {A} Structural Analysis of Pre-Trained Language Models for Source Code},
  booktitle  = {ICSE},
  pages      = {2377--2388},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3510003.3510050},
  doi        = {10.1145/3510003.3510050},
  timestamp  = {Tue, 13 Dec 2022 09:59:50 +0100},
  biburl     = {https://dblp.org/rec/conf/icse/WanZZSXJ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Code Review}
}


// from LI Jiaqi

@inproceedings{DBLP:conf/cvpr/LeiLZGBB021,
  author     = {Jie Lei and Linjie Li and Luowei Zhou and Zhe Gan and
                Tamara L. Berg and Mohit Bansal and Jingjing Liu},
  title      = {Less Is More: ClipBERT for Video-and-Language Learning via Sparse Sampling},
  booktitle  = {CVPR},
  pages      = {7331--7341},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2021},
  url        = {https://openaccess.thecvf.com/content/CVPR2021/html/Lei_Less_Is_More_ClipBERT_for_Video-and-Language_Learning_via_Sparse_Sampling_CVPR_2021_paper.html},
  doi        = {10.1109/CVPR46437.2021.00725},
  timestamp  = {Tue, 29 Nov 2022 14:53:03 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/LeiLZGBB021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@article{DBLP:journals/corr/abs-2102-10772,
  author     = {Ronghang Hu and Amanpreet Singh},
  title      = {Transformer is All You Need: Multimodal Multitask Learning with a Unified Transformer},
  journal    = {CoRR},
  volume     = {abs/2102.10772},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.10772},
  eprinttype = {arXiv},
  eprint     = {2102.10772},
  timestamp  = {Wed, 24 Feb 2021 15:42:45 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-10772.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/nips/Gan0LZ0020,
  author     = {Zhe Gan and Yen{-}Chun Chen and Linjie Li and Chen Zhu and
                Yu Cheng and Jingjing Liu},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and
                Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Large-Scale Adversarial Training for Vision-and-Language Representation Learning},
  booktitle  = {NeurIPS},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/49562478de4c54fafd4ec46fdb297de5-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 15:57:10 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Gan0LZ0020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/emnlp/TanB20,
  author     = {Hao Tan and Mohit Bansal},
  editor     = {Bonnie Webber and Trevor Cohn and Yulan He and Yang Liu},
  title      = {Vokenization: Improving Language Understanding with Contextualized, Visual-Grounded Supervision},
  booktitle  = {EMNLP},
  pages      = {2066--2080},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.162},
  doi        = {10.18653/v1/2020.emnlp-main.162},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/TanB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/acl/RahmanHLZMMH20,
  author     = {Wasifur Rahman and Md. Kamrul Hasan and Sangwu Lee and
                AmirAli Bagher Zadeh and Chengfeng Mao and
                Louis{-}Philippe Morency and Mohammed E. Hoque},
  editor     = {Dan Jurafsky and Joyce Chai and Natalie Schluter and
                Joel R. Tetreault},
  title      = {Integrating Multimodal Information in Large Pretrained Transformers},
  booktitle  = {ACL},
  pages      = {2359--2369},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.214},
  doi        = {10.18653/v1/2020.acl-main.214},
  timestamp  = {Thu, 17 Nov 2022 11:44:51 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/RahmanHLZMMH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/iclr/SuZCLLWD20,
  author     = {Weijie Su and Xizhou Zhu and Yue Cao and Bin Li and
                Lewei Lu and Furu Wei and Jifeng Dai},
  title      = {{VL-BERT:} Pre-training of Generic Visual-Linguistic Representations},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=SygXPaEYvH},
  timestamp  = {Tue, 12 Apr 2022 21:46:12 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/SuZCLLWD20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@article{DBLP:journals/corr/abs-1908-03557,
  author     = {Liunian Harold Li and Mark Yatskar and Da Yin and
                Cho{-}Jui Hsieh and Kai{-}Wei Chang},
  title      = {VisualBERT: {A} Simple and Performant Baseline for Vision and Language},
  journal    = {CoRR},
  volume     = {abs/1908.03557},
  year       = {2019},
  url        = {https://arxiv.org/abs/1908.03557},
  eprinttype = {arXiv},
  eprint     = {1908.03557},
  timestamp  = {Mon, 19 Aug 2019 13:21:03 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-03557.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/nips/LuBPL19,
  author     = {Jiasen Lu and Dhruv Batra and Devi Parikh and Stefan Lee},
  editor     = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and
                Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title      = {ViLBERT: Pretraining Task-Agnostic Visiolinguistic Representations for Vision-and-Language Tasks},
  booktitle  = {NeurIPS},
  pages      = {13--23},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/c74d97b01eae257e44aa9d5bade97baf-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LuBPL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/iccv/SunMV0S19,
  author     = {Chen Sun and Austin Myers and Carl Vondrick and Kevin Murphy and
                Cordelia Schmid},
  title      = {VideoBERT: {A} Joint Model for Video and Language Representation Learning},
  booktitle  = {ICCV},
  pages      = {7463--7472},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICCV.2019.00756},
  doi        = {10.1109/ICCV.2019.00756},
  timestamp  = {Wed, 21 Oct 2020 08:21:21 +0200},
  biburl     = {https://dblp.org/rec/conf/iccv/SunMV0S19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}


// from Zafar Ali


@inproceedings{DBLP:conf/acl/HamLJK20,
  author     = {DongHoon Ham and Jeong{-}Gwan Lee and Youngsoo Jang and
                Kee{-}Eung Kim},
  editor     = {Dan Jurafsky and Joyce Chai and Natalie Schluter and
                Joel R. Tetreault},
  title      = {End-to-End Neural Pipeline for Goal-Oriented Dialogue Systems using {GPT-2}},
  booktitle  = {ACL},
  pages      = {583--592},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.54},
  doi        = {10.18653/v1/2020.acl-main.54},
  timestamp  = {Fri, 06 Aug 2021 00:40:59 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/HamLJK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@article{DBLP:journals/corr/abs-2101-09459,
  author     = {Chongming Gao and Wenqiang Lei and Xiangnan He and Maarten de Rijke and
                Tat{-}Seng Chua},
  title      = {Advances and Challenges in Conversational Recommender Systems: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2101.09459},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.09459},
  eprinttype = {arXiv},
  eprint     = {2101.09459},
  timestamp  = {Sat, 30 Jan 2021 18:02:51 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-09459.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System, Survey}
}

@article{DBLP:journals/tkde/GuoZQZXXH22,
  author     = {Qingyu Guo and Fuzhen Zhuang and Chuan Qin and Hengshu Zhu and
                Xing Xie and Hui Xiong and Qing He},
  title      = {A Survey on Knowledge Graph-Based Recommender Systems},
  journal    = {TKDE},
  volume     = {34},
  number     = {8},
  pages      = {3549--3568},
  year       = {2022},
  url        = {https://doi.org/10.1109/TKDE.2020.3028705},
  doi        = {10.1109/TKDE.2020.3028705},
  timestamp  = {Mon, 08 Aug 2022 21:23:43 +0200},
  biburl     = {https://dblp.org/rec/journals/tkde/GuoZQZXXH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System, Survey}
}

@inproceedings{DBLP:conf/sigir/YuY00CN22,
  author     = {Junliang Yu and Hongzhi Yin and Xin Xia and Tong Chen and
                Lizhen Cui and Quoc Viet Hung Nguyen},
  editor     = {Enrique Amig{\'{o}} and Pablo Castells and Julio Gonzalo and
                Ben Carterette and J. Shane Culpepper and Gabriella Kazai},
  title      = {Are Graph Augmentations Necessary?: Simple Graph Contrastive Learning for Recommendation},
  booktitle  = {SIGIR},
  pages      = {1294--1303},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3477495.3531937},
  doi        = {10.1145/3477495.3531937},
  timestamp  = {Wed, 07 Dec 2022 23:08:55 +0100},
  biburl     = {https://dblp.org/rec/conf/sigir/YuY00CN22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System}
}

@article{guo2022disentangled,
  title={Disentangled Representations Learning for Multi-Target Cross-Domain Recommendation},
  author={Guo, Xiaobo and Li, Shaoshuai and Guo, Naicheng and Cao, Jiangxia and Liu, Xiaolei and Ma, Qiongxu and Gan, Runsheng and Zhao, Yunan},
  journal={TOIS},
  year={2022},
  publisher={{ACM}},
  address={New York, NY},
  url={https://dl.acm.org/doi/abs/10.1145/3572835},
  doi={10.1145/3572835},
  keywords={Recommender System}
}

@article{DBLP:journals/corr/abs-2212-02851,
  author     = {Praveen Venkateswaran and Evelyn Duesterwald and Vatche Isahagian},
  title      = {DiSTRICT: Dialogue State Tracking with Retriever Driven In-Context Tuning},
  journal    = {CoRR},
  volume     = {abs/2212.02851},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.02851},
  doi        = {10.48550/arXiv.2212.02851},
  eprinttype = {arXiv},
  eprint     = {2212.02851},
  timestamp  = {Thu, 08 Dec 2022 15:26:56 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-02851.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/coling/LeeLC22,
  author    = {Young{-}Jun Lee and
               Chae{-}Gyun Lim and
               Ho{-}Jin Choi},
  editor    = {Nicoletta Calzolari and
               Chu{-}Ren Huang and
               Hansaem Kim and
               James Pustejovsky and
               Leo Wanner and
               Key{-}Sun Choi and
               Pum{-}Mo Ryu and
               Hsin{-}Hsi Chen and
               Lucia Donatelli and
               Heng Ji and
               Sadao Kurohashi and
               Patrizia Paggio and
               Nianwen Xue and
               Seokhwan Kim and
               Younggyun Hahm and
               Zhong He and
               Tony Kyungil Lee and
               Enrico Santus and
               Francis Bond and
               Seung{-}Hoon Na},
  title     = {Does {GPT-3} Generate Empathetic Dialogues? {A} Novel In-Context Example
               Selection Method and Automatic Evaluation Metric for Empathetic Dialogue
               Generation},
  booktitle = {COLING},
  pages     = {669--683},
  publisher = {International Committee on Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.coling-1.56},
  timestamp = {Thu, 13 Oct 2022 17:29:38 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/LeeLC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Dialogue System, In-Context Learning}
}

@inproceedings{DBLP:conf/emnlp/00010O21,
  author     = {Chia{-}Hsuan Lee and Hao Cheng and Mari Ostendorf},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {Dialogue State Tracking with a Language Model using Schema-Driven Prompting},
  booktitle  = {EMNLP},
  pages      = {4937--4949},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.404},
  doi        = {10.18653/v1/2021.emnlp-main.404},
  timestamp  = {Thu, 20 Jan 2022 10:02:14 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/00010O21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@article{DBLP:journals/corr/abs-2110-08118,
  author     = {Andrea Madotto and Zhaojiang Lin and Genta Indra Winata and Pascale Fung},
  title      = {Few-Shot Bot: Prompt-Based Learning for Dialogue Systems},
  journal    = {CoRR},
  volume     = {abs/2110.08118},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.08118},
  eprinttype = {arXiv},
  eprint     = {2110.08118},
  timestamp  = {Fri, 22 Oct 2021 13:33:09 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-08118.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/aaai/YoungXPNC22,
  author     = {Tom Young and Frank Xing and Vlad Pandelea and Jinjie Ni and Erik Cambria},
  title      = {Fusing Task-Oriented and Open-Domain Dialogues in Conversational Agents},
  booktitle  = {AAAI},
  pages      = {11622--11629},
  publisher  = {{AAAI} Press},
  year       = {2022},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/21416},
  timestamp  = {Tue, 12 Jul 2022 14:14:21 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/YoungXPNC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@article{DBLP:journals/corr/abs-2206-11309,
  author     = {Baolin Peng and Michel Galley and Pengcheng He and Chris Brockett and
                Lars Liden and Elnaz Nouri and Zhou Yu and Bill Dolan and Jianfeng Gao},
  title      = {{GODEL:} Large-Scale Pre-Training for Goal-Directed Dialog},
  journal    = {CoRR},
  volume     = {abs/2206.11309},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.11309},
  doi        = {10.48550/arXiv.2206.11309},
  eprinttype = {arXiv},
  eprint     = {2206.11309},
  timestamp  = {Mon, 27 Jun 2022 16:51:57 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-11309.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@article{DBLP:journals/corr/abs-2212-09252,
  author     = {Sagi Shaier and Lawrence Hunter and Katharina Kann},
  title      = {Mind the Knowledge Gap: {A} Survey of Knowledge-enhanced Dialogue Systems},
  journal    = {CoRR},
  volume     = {abs/2212.09252},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.09252},
  doi        = {10.48550/arXiv.2212.09252},
  eprinttype = {arXiv},
  eprint     = {2212.09252},
  timestamp  = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-09252.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System, Knowledge Enhanced, Survey}
}

@inproceedings{DBLP:conf/naacl/ChenCYLY21,
  author     = {Derek Chen and Howard Chen and Yi Yang and Alexander Lin and Zhou Yu},
  editor     = {Kristina Toutanova and Anna Rumshisky and Luke Zettlemoyer and
                Dilek Hakkani{-}T{\"{u}}r and Iz Beltagy and Steven Bethard and
                Ryan Cotterell and Tanmoy Chakraborty and Yichao Zhou},
  title      = {Action-Based Conversations Dataset: {A} Corpus for Building More In-Depth
                Task-Oriented Dialogue Systems},
  booktitle  = {NAACL},
  pages      = {3002--3017},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.naacl-main.239},
  doi        = {10.18653/v1/2021.naacl-main.239},
  timestamp  = {Fri, 24 Jun 2022 12:17:37 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/ChenCYLY21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/naacl/HanHKKS21,
  author     = {Janghoon Han and Taesuk Hong and Byoungjae Kim and Youngjoong Ko and Jungyun Seo},
  editor     = {Kristina Toutanova and Anna Rumshisky and Luke Zettlemoyer and
                Dilek Hakkani{-}T{\"{u}}r and Iz Beltagy and Steven Bethard and
                Ryan Cotterell and Tanmoy Chakraborty and Yichao Zhou},
  title      = {Fine-grained Post-training for Improving Retrieval-based Dialogue Systems},
  booktitle  = {NAACL},
  pages      = {1549--1558},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.naacl-main.122},
  doi        = {10.18653/v1/2021.naacl-main.122},
  timestamp  = {Fri, 06 Aug 2021 00:41:31 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/HanHKKS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/nips/Hosseini-AslMWY20,
  author     = {Ehsan Hosseini{-}Asl and Bryan McCann and Chien{-}Sheng Wu and
                Semih Yavuz and Richard Socher},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and
                Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {A Simple Language Model for Task-Oriented Dialogue},
  booktitle  = {NeurIPS},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/e946209592563be0f01c844ab2170f0c-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 15:57:40 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Hosseini-AslMWY20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/mm/LiuYLWTZSM21,
  author     = {Yong Liu and Susen Yang and Chenyi Lei and Guoxin Wang and
                Haihong Tang and Juyong Zhang and Aixin Sun and Chunyan Miao},
  editor     = {Heng Tao Shen and Yueting Zhuang and John R. Smith and Yang Yang and
                Pablo C{\'{e}}sar and Florian Metze and Balakrishnan Prabhakaran},
  title      = {Pre-training Graph Transformer with Multimodal Side Information for Recommendation},
  booktitle  = {MM},
  pages      = {2853--2861},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3474085.3475709},
  doi        = {10.1145/3474085.3475709},
  timestamp  = {Fri, 02 Dec 2022 08:27:05 +0100},
  biburl     = {https://dblp.org/rec/conf/mm/LiuYLWTZSM21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System, Multimodal}
}

@article{DBLP:journals/corr/abs-2105-04387,
  author     = {Jinjie Ni and Tom Young and Vlad Pandelea and Fuzhao Xue and
                Vinay Adiga and Erik Cambria},
  title      = {Recent Advances in Deep Learning Based Dialogue Systems: {A} Systematic Survey},
  journal    = {CoRR},
  volume     = {abs/2105.04387},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.04387},
  eprinttype = {arXiv},
  eprint     = {2105.04387},
  timestamp  = {Mon, 31 May 2021 08:19:46 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-04387.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System, Survey}
}

@inproceedings{DBLP:conf/sigir/XinPKRCR22,
  author     = {Xin Xin and Tiago Pimentel and Alexandros Karatzoglou and Pengjie Ren and
                Konstantina Christakopoulou and Zhaochun Ren},
  editor     = {Enrique Amig{\'{o}} and Pablo Castells and Julio Gonzalo and
                Ben Carterette and J. Shane Culpepper and Gabriella Kazai},
  title      = {Rethinking Reinforcement Learning for Recommendation: {A} Prompt Perspective},
  booktitle  = {SIGIR},
  pages      = {1347--1357},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3477495.3531714},
  doi        = {10.1145/3477495.3531714},
  timestamp  = {Fri, 04 Nov 2022 16:12:03 +0100},
  biburl     = {https://dblp.org/rec/conf/sigir/XinPKRCR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System}
}

@inproceedings{DBLP:conf/www/YeMZLY21,
  author     = {Fanghua Ye and Jarana Manotumruksa and Qiang Zhang and Shenghui Li and Emine Yilmaz},
  editor     = {Jure Leskovec and Marko Grobelnik and Marc Najork and Jie Tang and Leila Zia},
  title      = {Slot Self-Attentive Dialogue State Tracking},
  booktitle  = {WWW},
  pages      = {1598--1608},
  publisher  = {{ACM} / {IW3C2}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3442381.3449939},
  doi        = {10.1145/3442381.3449939},
  timestamp  = {Tue, 14 Sep 2021 14:27:30 +0200},
  biburl     = {https://dblp.org/rec/conf/www/YeMZLY21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@article{DBLP:journals/tacl/LiuYRB21,
  author     = {Qi Liu and Lei Yu and Laura Rimell and Phil Blunsom},
  title      = {Pretraining the Noisy Channel Model for Task-Oriented Dialogue},
  journal    = {TACL},
  volume     = {9},
  pages      = {657--674},
  year       = {2021},
  url        = {https://doi.org/10.1162/tacl\_a\_00390},
  doi        = {10.1162/tacl\_a\_00390},
  timestamp  = {Thu, 04 Aug 2022 13:12:54 +0200},
  biburl     = {https://dblp.org/rec/journals/tacl/LiuYRB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}

@inproceedings{DBLP:conf/aaai/0001SJ20,
  author     = {Tong Yu and Yilin Shen and Hongxia Jin},
  title      = {Towards Hands-Free Visual Dialog Interactive Recommendation},
  booktitle  = {AAAI},
  pages      = {1137--1144},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/5465},
  timestamp  = {Mon, 07 Mar 2022 16:58:16 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/0001SJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System}
}

@inproceedings{DBLP:conf/aaai/YangLQ21,
  author     = {Yunyi Yang and Yunhao Li and Xiaojun Quan},
  title      = {{UBAR:} Towards Fully End-to-End Task-Oriented Dialog System with {GPT-2}},
  booktitle  = {AAAI},
  pages      = {14230--14238},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/17674},
  timestamp  = {Mon, 07 Jun 2021 11:46:04 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/YangLQ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Dialogue System}
}


// 0216 from QI

@inproceedings{DBLP:conf/icer/SarsaDH022,
  author     = {Sami Sarsa and Paul Denny and Arto Hellas and Juho Leinonen},
  editor     = {Jan Vahrenhold and Kathi Fisler and Matthias Hauswirth and Diana Franklin},
  title      = {Automatic Generation of Programming Exercises and Code Explanations
                Using Large Language Models},
  booktitle  = {ICER},
  pages      = {27--43},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3501385.3543957},
  doi        = {10.1145/3501385.3543957},
  timestamp  = {Wed, 07 Dec 2022 23:07:32 +0100},
  biburl     = {https://dblp.org/rec/conf/icer/SarsaDH022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation}
}

@article{DBLP:journals/corr/abs-2302-04813,
  author     = {Xi Ye and Greg Durrett},
  title      = {Explanation Selection Using Unlabeled Data for In-Context Learning},
  journal    = {CoRR},
  volume     = {abs/2302.04813},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.04813},
  doi        = {10.48550/arXiv.2302.04813},
  eprinttype = {arXiv},
  eprint     = {2302.04813},
  timestamp  = {Mon, 13 Feb 2023 14:23:40 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-04813.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

@article{qin2023chatgpt,
  title={Is {ChatGPT} a General-Purpose Natural Language Processing Task Solver?},
  author={Qin, Chengwei and Zhang, Aston and Zhang, Zhuosheng and Chen, Jiaao and Yasunaga, Michihiro and Yang, Diyi},
  journal={CoRR},
  volume={abs/2302.06476},
  year={2023},
  url={https://arxiv.org/abs/2302.06476},
  eprinttype={arXiv},
  eprint={2302.06476},
  keywords={Evaluation}
}

@article{DBLP:journals/corr/abs-2301-11596,
  author     = {Simon Ott and Konstantin Hebenstreit and Valentin Li{\'{e}}vin and
                Christoffer Egeberg Hother and Milad Moradi and Maximilian Mayrhauser and
                Robert Praas and Ole Winther and Matthias Samwald},
  title      = {ThoughtSource: {A} central hub for large language model reasoning data},
  journal    = {CoRR},
  volume     = {abs/2301.11596},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.11596},
  doi        = {10.48550/arXiv.2301.11596},
  eprinttype = {arXiv},
  eprint     = {2301.11596},
  timestamp  = {Tue, 31 Jan 2023 16:32:10 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-11596.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Reasoning}
}

@article{DBLP:journals:corr:abs-2302-04931,
  author     = {Mukai Li and Shansan Gong and Jiangtao Feng and Yiheng Xu and
                Jun Zhang and Zhiyong Wu and Lingpeng Kong},
  title      = {In-Context Learning with Many Demonstration Examples},
  journal    = {CoRR},
  volume     = {abs/2302.04931},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.04931},
  doi        = {10.48550/arXiv.2302.04931},
  eprinttype = {arXiv},
  eprint     = {2302.04931},
  timestamp  = {Mon, 13 Feb 2023 14:23:40 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-04931.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}
@String(DBLP:journals:corr:abs-2302-04931="This paper proposes a LM named EvaLM to scale up the sequence length (trained with 8k tokens per batch line). Experiments based on EvaLM prove that in-context learning can achieve higher performance with more demonstrations under many-shot instruction tuning (8k) and further extending the length of instructions (16k) can further improve the upper bound of scaling in-context  learning.")

@article{DBLP:journals/corr/abs-2302-00093,
  author     = {Freda Shi and Xinyun Chen and Kanishka Misra and Nathan Scales and
                David Dohan and Ed H. Chi and Nathanael Sch{\"{a}}rli and Denny Zhou},
  title      = {Large Language Models Can Be Easily Distracted by Irrelevant Context},
  journal    = {CoRR},
  volume     = {abs/2302.00093},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.00093},
  doi        = {10.48550/arXiv.2302.00093},
  eprinttype = {arXiv},
  eprint     = {2302.00093},
  timestamp  = {Thu, 09 Feb 2023 16:11:17 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-00093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning}
}

@inproceedings{DBLP:conf/acl/GongZZSWW22,
  author     = {Zheng Gong and Kun Zhou and Xin Zhao and Jing Sha and
                Shijin Wang and Ji{-}Rong Wen},
  editor     = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio},
  title      = {Continual Pre-training of Language Models for Math Problem Understanding
                with Syntax-Aware Memory Network},
  booktitle  = {ACL},
  pages      = {5923--5933},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.408},
  doi        = {10.18653/v1/2022.acl-long.408},
  timestamp  = {Mon, 01 Aug 2022 16:27:47 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/GongZZSWW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Continual Learning}
}

@article{DBLP:journals/corr/abs-2301-05578,
  author     = {Justin D. Weisz and Michael J. Muller and Jessica He and Stephanie Houde},
  title      = {Toward General Design Principles for Generative {AI} Applications},
  journal    = {CoRR},
  volume     = {abs/2301.05578},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.05578},
  doi        = {10.48550/arXiv.2301.05578},
  eprinttype = {arXiv},
  eprint     = {2301.05578},
  timestamp  = {Thu, 19 Jan 2023 15:40:01 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-05578.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Others}
}

@inproceedings{DBLP:conf/emnlp/Ye0CC22,
  author     = {Hongbin Ye and Ningyu Zhang and Hui Chen and Huajun Chen},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {Generative Knowledge Graph Construction: {A} Review},
  booktitle  = {EMNLP},
  pages      = {1--17},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.1},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/Ye0CC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@article{DBLP:journals/corr/abs-2209-07686,
  author     = {Aman Madaan and Amir Yazdanbakhsh},
  title      = {Text and Patterns: For Effective Chain of Thought, It Takes Two to Tango},
  journal    = {CoRR},
  volume     = {abs/2209.07686},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.07686},
  doi        = {10.48550/arXiv.2209.07686},
  eprinttype = {arXiv},
  eprint     = {2209.07686},
  timestamp  = {Tue, 27 Sep 2022 16:29:43 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-07686.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2212-10001,
  author     = {Boshi Wang and Sewon Min and Xiang Deng and Jiaming Shen and
                You Wu and Luke Zettlemoyer and Huan Sun},
  title      = {Towards Understanding Chain-of-Thought Prompting: An Empirical Study of What Matters},
  journal    = {CoRR},
  volume     = {abs/2212.10001},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10001},
  doi        = {10.48550/arXiv.2212.10001},
  eprinttype = {arXiv},
  eprint     = {2212.10001},
  timestamp  = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10001.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2210-09150,
  author     = {Chenglei Si and Zhe Gan and Zhengyuan Yang and Shuohang Wang and
                Jianfeng Wang and Jordan L. Boyd{-}Graber and Lijuan Wang},
  title      = {Prompting {GPT-3} To Be Reliable},
  journal    = {CoRR},
  volume     = {abs/2210.09150},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.09150},
  doi        = {10.48550/arXiv.2210.09150},
  eprinttype = {arXiv},
  eprint     = {2210.09150},
  timestamp  = {Wed, 19 Oct 2022 12:47:31 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-09150.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Reliability}
}

@article{DBLP:journals/corr/abs-2204-02311,
  author     = {Aakanksha Chowdhery and Sharan Narang and Jacob Devlin and Maarten Bosma and
                Gaurav Mishra and Adam Roberts and Paul Barham and Hyung Won Chung and
                Charles Sutton and Sebastian Gehrmann and Parker Schuh and Kensen Shi and
                Sasha Tsvyashchenko and Joshua Maynez and Abhishek Rao and Parker Barnes and
                Yi Tay and Noam Shazeer and Vinodkumar Prabhakaran and Emily Reif and
                Nan Du and Ben Hutchinson and Reiner Pope and James Bradbury and
                Jacob Austin and Michael Isard and Guy Gur{-}Ari and Pengcheng Yin and
                Toju Duke and Anselm Levskaya and Sanjay Ghemawat and Sunipa Dev and
                Henryk Michalewski and Xavier Garcia and Vedant Misra and Kevin Robinson and
                Liam Fedus and Denny Zhou and Daphne Ippolito and David Luan and
                Hyeontaek Lim and Barret Zoph and Alexander Spiridonov and Ryan Sepassi and
                David Dohan and Shivani Agrawal and Mark Omernick and Andrew M. Dai and
                Thanumalayan Sankaranarayana Pillai and Marie Pellat and Aitor Lewkowycz and
                Erica Moreira and Rewon Child and Oleksandr Polozov and Katherine Lee and
                Zongwei Zhou and Xuezhi Wang and Brennan Saeta and Mark Diaz and
                Orhan Firat and Michele Catasta and Jason Wei and Kathy Meier{-}Hellstern and
                Douglas Eck and Jeff Dean and Slav Petrov and Noah Fiedel},
  title      = {PaLM: Scaling Language Modeling with Pathways},
  journal    = {CoRR},
  volume     = {abs/2204.02311},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.02311},
  doi        = {10.48550/arXiv.2204.02311},
  eprinttype = {arXiv},
  eprint     = {2204.02311},
  timestamp  = {Tue, 16 Aug 2022 23:07:05 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-02311.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


// from Zhang Yuxin

@inproceedings{DBLP:conf/acl/YangFQKL19,
  author     = {Sen Yang and Dawei Feng and Linbo Qiao and Zhigang Kan and Dongsheng Li},
  editor     = {Anna Korhonen and David R. Traum and Llu{\'{\i}}s M{\`{a}}rquez},
  title      = {Exploring Pre-trained Language Models for Event Extraction and Generation},
  booktitle  = {ACL},
  pages      = {5284--5294},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  url        = {https://doi.org/10.18653/v1/p19-1522},
  doi        = {10.18653/v1/p19-1522},
  timestamp  = {Fri, 06 Aug 2021 00:41:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/YangFQKL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Event Extraction}
}

@inproceedings{DBLP:conf/acl-louhi/WangWL20,
  author    = {Xing David Wang and
               Leon Weber and
               Ulf Leser},
  editor    = {Eben Holderness and
               Antonio Jimeno{-}Yepes and
               Alberto Lavelli and
               Anne{-}Lyse Minard and
               James Pustejovsky and
               Fabio Rinaldi},
  title     = {Biomedical Event Extraction as Multi-turn Question Answering},
  booktitle = {EMNLP},
  pages     = {88--96},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.louhi-1.10},
  doi       = {10.18653/v1/2020.louhi-1.10},
  timestamp = {Fri, 06 Aug 2021 00:41:34 +0200},
  biburl    = {https://dblp.org/rec/conf/acl-louhi/WangWL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Event Extraction}
}

@inproceedings{DBLP:conf/emnlp/ZhangYZ20,
  author    = {Rongzhi Zhang and
               Yue Yu and
               Chao Zhang},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {SeqMix: Augmenting Active Sequence Labeling via Sequence Mixup},
  booktitle = {EMNLP},
  pages     = {8566--8579},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.691},
  doi       = {10.18653/v1/2020.emnlp-main.691},
  timestamp = {Sun, 02 Oct 2022 16:00:27 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/ZhangYZ20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Event Extraction, Data Augmentation}
}

@inproceedings{DBLP:conf/acl/VeysehLDN20,
  author    = {Amir Pouran Ben Veyseh and
               Viet Dac Lai and
               Franck Dernoncourt and
               Thien Huu Nguyen},
  title     = {Unleash {GPT-2} Power for Event Detection},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  booktitle = {ACL},
  pages     = {6271--6282},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.acl-long.490},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.490},
  timestamp = {Fri, 28 Jan 2022 23:51:19 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/VeysehLDN20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/emnlp/LiuCX21,
  author    = {Jian Liu and
               Yufeng Chen and
               Jinan Xu},
  title     = {Machine Reading Comprehension as Data Augmentation: {A} Case Study on Implicit Event Argument Extraction},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  booktitle = {EMNLP},
  pages     = {2716--2725},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.emnlp-main.214},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.214},
  timestamp = {Thu, 20 Jan 2022 10:02:36 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/LiuCX21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/emnlp/VeysehNNMN21,
  author    = {Amir Pouran Ben Veyseh and
               Minh Van Nguyen and
               Nghia Trung Ngo and
               Bonan Min and
               Thien Huu Nguyen},
  title     = {Modeling Document-Level Context for Event Detection via Important Context Selection},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  booktitle = {EMNLP},
  pages     = {5403--5413},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.emnlp-main.439},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.439},
  timestamp = {Thu, 20 Jan 2022 10:02:33 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/VeysehNNMN21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/naacl/Guzman-NaterasN22,
  author    = {Luis Guzman{-}Nateras and
               Minh Van Nguyen and
               Thien Nguyen},
  title     = {Cross-Lingual Event Detection via Optimized Adversarial Training},
  editor    = {Marine Carpuat and
               Marie{-}Catherine de Marneffe and
               Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  booktitle = {NAACL},
  pages     = {5588--5599},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  doi       = {10.18653/v1/2022.naacl-main.409},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.409},
  timestamp = {Mon, 01 Aug 2022 16:28:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/Guzman-NaterasN22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/starsem/VeysehN22,
  author    = {Amir Pouran Ben Veyseh and
               Thien Huu Nguyen},
  title     = {Word-Label Alignment for Event Detection: {A} New Perspective via Optimal Transport},
  editor    = {Vivi Nastase and
               Ellie Pavlick and
               Mohammad Taher Pilehvar and
               Jos{\'{e}} Camacho{-}Collados and
               Alessandro Raganato},
  booktitle = {NAACL},
  pages     = {132--138},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  doi       = {10.18653/v1/2022.starsem-1.11},
  url       = {https://doi.org/10.18653/v1/2022.starsem-1.11},
  timestamp = {Mon, 26 Sep 2022 16:58:59 +0200},
  biburl    = {https://dblp.org/rec/conf/starsem/VeysehN22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/emnlp/NguyenMDN22,
  author    = {Minh Van Nguyen and
               Bonan Min and
               Franck Dernoncourt and
               Thien Nguyen},
  title     = {Learning Cross-Task Dependencies for Joint Extraction of Entities, Events, Event Arguments, and Relations},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {9349--9360},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.634},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/NguyenMDN22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction, Event Relation Extraction}
}

@inproceedings{DBLP:conf/pkdd/VeysehNMN21,
  author    = {Amir Pouran Ben Veyseh and
               Minh Van Nguyen and
               Bonan Min and
               Thien Huu Nguyen},
  title     = {Augmenting Open-Domain Event Detection with Synthetic Data from {GPT-2}},
  editor    = {Nuria Oliver and
               Fernando P{\'{e}}rez{-}Cruz and
               Stefan Kramer and
               Jesse Read and
               Jos{\'{e}} Antonio Lozano},
  booktitle = {ECML},
  series    = {Lecture Notes in Computer Science},
  volume    = {12977},
  pages     = {644--660},
  publisher = {Springer},
  year      = {2021},
  doi       = {10.1007/978-3-030-86523-8\_39},
  url       = {https://doi.org/10.1007/978-3-030-86523-8\_39},
  timestamp = {Mon, 24 Jan 2022 07:48:09 +0100},
  biburl    = {https://dblp.org/rec/conf/pkdd/VeysehNMN21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction}
}

@inproceedings{DBLP:conf/cvpr/LiXWZ0Z0JC22,
  author    = {Manling Li and
               Ruochen Xu and
               Shuohang Wang and
               Luowei Zhou and
               Xudong Lin and
               Chenguang Zhu and
               Michael Zeng and
               Heng Ji and
               Shih{-}Fu Chang},
  title     = {CLIP-Event: Connecting Text and Images with Event Structures},
  booktitle = {CVPR},
  pages     = {16399--16408},
  publisher = {{IEEE}},
  year      = {2022},
  doi       = {10.1109/CVPR52688.2022.01593},
  url       = {https://doi.org/10.1109/CVPR52688.2022.01593},
  timestamp = {Wed, 23 Nov 2022 16:47:01 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/LiXWZ0Z0JC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Extraction, Multimodal}
}

@inproceedings{DBLP:conf/aaai/ManNVN22,
  author    = {Hieu Man and
               Nghia Trung Ngo and
               Linh Ngo Van and
               Thien Huu Nguyen},
  title     = {Selecting Optimal Context Sentences for Event-Event Relation Extraction},
  booktitle = {AAAI},
  pages     = {11058--11066},
  publisher = {{AAAI} Press},
  year      = {2022},
  url       = {https://ojs.aaai.org/index.php/AAAI/article/view/21354},
  timestamp = {Tue, 12 Jul 2022 14:14:21 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/ManNVN22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}

@inproceedings{DBLP:conf/emnlp/ZhangCM21,
  author    = {Xiyang Zhang and
               Muhao Chen and
               Jonathan May},
  title     = {Salience-Aware Event Chain Modeling for Narrative Understanding},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  booktitle = {EMNLP},
  pages     = {1418--1428},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.emnlp-main.107},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.107},
  timestamp = {Thu, 20 Jan 2022 10:02:19 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ZhangCM21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}

@inproceedings{DBLP:conf/emnlp/LaiMVDN22,
  author    = {Viet Dac Lai and
               Hieu Man and
               Linh Ngo Van and
               Franck Dernoncourt and
               Thien Nguyen},
  title     = {Multilingual SubEvent Relation Extraction: {A} Novel Dataset and Structure Induction Method},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP Findings},
  pages     = {5559--5570},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.findings-emnlp.407},
  timestamp = {Tue, 07 Feb 2023 17:10:52 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/LaiMVDN22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}

@inproceedings{DBLP:conf/emnlp/WangCZR20,
  author    = {Haoyu Wang and
               Muhao Chen and
               Hongming Zhang and
               Dan Roth},
  title     = {Joint Constrained Learning for Event-Event Relation Extraction},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  booktitle = {EMNLP},
  pages     = {696--706},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  doi       = {10.18653/v1/2020.emnlp-main.51},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.51},
  timestamp = {Fri, 20 Jan 2023 11:25:15 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/WangCZR20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}

@inproceedings{DBLP:conf/coling/ShenZWQ22,
  author    = {Shirong Shen and
               Heng Zhou and
               Tongtong Wu and
               Guilin Qi},
  title     = {Event Causality Identification via Derivative Prompt Joint Learning},
  editor    = {Nicoletta Calzolari and
               Chu{-}Ren Huang and
               Hansaem Kim and
               James Pustejovsky and
               Leo Wanner and
               Key{-}Sun Choi and
               Pum{-}Mo Ryu and
               Hsin{-}Hsi Chen and
               Lucia Donatelli and
               Heng Ji and
               Sadao Kurohashi and
               Patrizia Paggio and
               Nianwen Xue and
               Seokhwan Kim and
               Younggyun Hahm and
               Zhong He and
               Tony Kyungil Lee and
               Enrico Santus and
               Francis Bond and
               Seung{-}Hoon Na},
  booktitle = {COLING},
  pages     = {2288--2299},
  publisher = {International Committee on Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.coling-1.200},
  timestamp = {Thu, 13 Oct 2022 17:29:38 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/ShenZWQ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}


// 0217 from QI

@inproceedings{zhang2022improved,
  author    = {Zhang, Hanlin and
               Li, Ziyang and
               Huang, Jiani and
               Naik, Mayur and
               Xing, Eric},
  title     = {Improved logical reasoning of language models via differentiable symbolic programming},
  booktitle = {ICML},
  year      = {2022},
  url       = {https://openreview.net/forum?id=8lNy3QCaxHX},
  keywords  = {Symbolic Reasoning}
}

@inproceedings{DBLP:conf/emnlp/MishraFLTWBRTSC22,
  author    = {Swaroop Mishra and
               Matthew Finlayson and
               Pan Lu and
               Leonard Tang and
               Sean Welleck and
               Chitta Baral and
               Tanmay Rajpurohit and
               Oyvind Tafjord and
               Ashish Sabharwal and
               Peter Clark and
               Ashwin Kalyan},
  title     = {{LILA:} {A} Unified Benchmark for Mathematical Reasoning},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {5807--5832},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.392},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/MishraFLTWBRTSC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Arithmetic Reasoning}
}

@inproceedings{DBLP:conf/emnlp/JungQWBB0C22,
  author    = {Jaehun Jung and
               Lianhui Qin and
               Sean Welleck and
               Faeze Brahman and
               Chandra Bhagavatula and
               Ronan Le Bras and
               Yejin Choi},
  title     = {Maieutic Prompting: Logically Consistent Reasoning with Recursive Explanations},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {1266--1279},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.82},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/JungQWBB0C22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Symbolic Reasoning}
}

@article{DBLP:journals/corr/abs-2302-02093,
  author    = {Tanmoy Chowdhury and
               Chen Ling and
               Xuchao Zhang and
               Xujiang Zhao and
               Guangji Bai and
               Jian Pei and
               Haifeng Chen and
               Liang Zhao},
  title     = {Knowledge-enhanced Neural Machine Reasoning: {A} Review},
  journal   = {CoRR},
  volume    = {abs/2302.02093},
  year      = {2023},
  doi       = {10.48550/arXiv.2302.02093},
  url       = {https://doi.org/10.48550/arXiv.2302.02093},
  eprinttype = {arXiv},
  eprint    = {2302.02093},
  timestamp = {Fri, 10 Feb 2023 12:26:38 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-02093.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Reasoning, Knowledge Enhanced}
}

@article{DBLP:journals/corr/abs-2212-13894,
  author    = {Seyed Mehran Kazemi and
               Najoung Kim and
               Deepti Bhatia and
               Xin Xu and
               Deepak Ramachandran},
  title     = {{LAMBADA:} Backward Chaining for Automated Reasoning in Natural Language},
  journal   = {CoRR},
  volume    = {abs/2212.13894},
  year      = {2022},
  doi       = {10.48550/arXiv.2212.13894},
  url       = {https://doi.org/10.48550/arXiv.2212.13894},
  eprinttype = {arXiv},
  eprint    = {2212.13894},
  timestamp = {Thu, 05 Jan 2023 12:00:28 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-13894.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2301-13808,
  author    = {Yunhu Ye and
               Binyuan Hui and
               Min Yang and
               Binhua Li and
               Fei Huang and
               Yongbin Li},
  title     = {Large Language Models are Versatile Decomposers: Decompose Evidence and Questions for Table-based Reasoning},
  journal   = {CoRR},
  volume    = {abs/2301.13808},
  year      = {2023},
  doi       = {10.48550/arXiv.2301.13808},
  url       = {https://doi.org/10.48550/arXiv.2301.13808},
  eprinttype = {arXiv},
  eprint    = {2301.13808},
  timestamp = {Thu, 02 Feb 2023 12:02:45 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-13808.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Reasoning}
}

@article{DBLP:journals/corr/abs-2212-08607,
  author    = {Swarnadeep Saha and
               Xinyan Velocity Yu and
               Mohit Bansal and
               Ramakanth Pasunuru and
               Asli Celikyilmaz},
  title     = {{MURMUR:} Modular Multi-Step Reasoning for Semi-Structured Data-to-Text Generation},
  journal   = {CoRR},
  volume    = {abs/2212.08607},
  year      = {2022},
  doi       = {10.48550/arXiv.2212.08607},
  url       = {https://doi.org/10.48550/arXiv.2212.08607},
  eprinttype = {arXiv},
  eprint    = {2212.08607},
  timestamp = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-08607.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Multi-Step Reasoning}
}

@article{DBLP:journals/corr/abs-2211-12588,
  author    = {Wenhu Chen and
               Xueguang Ma and
               Xinyi Wang and
               William W. Cohen},
  title     = {Program of Thoughts Prompting: Disentangling Computation from Reasoning for Numerical Reasoning Tasks},
  journal   = {CoRR},
  volume    = {abs/2211.12588},
  year      = {2022},
  doi       = {10.48550/arXiv.2211.12588},
  url       = {https://doi.org/10.48550/arXiv.2211.12588},
  eprinttype = {arXiv},
  eprint    = {2211.12588},
  timestamp = {Tue, 29 Nov 2022 17:41:18 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2211-12588.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Arithmetic Reasoning}
}

@article{DBLP:journals/corr/abs-2301-12726,
  author    = {Yao Fu and
               Hao Peng and
               Litu Ou and
               Ashish Sabharwal and
               Tushar Khot},
  title     = {Specializing Smaller Language Models towards Multi-Step Reasoning},
  journal   = {CoRR},
  volume    = {abs/2301.12726},
  year      = {2023},
  doi       = {10.48550/arXiv.2301.12726},
  url       = {https://doi.org/10.48550/arXiv.2301.12726},
  eprinttype = {arXiv},
  eprint    = {2301.12726},
  timestamp = {Wed, 01 Feb 2023 14:38:31 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-12726.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Multi-Step Reasoning}
}

@article{DBLP:journals/corr/abs-2212-08686,
  author    = {Hanlin Zhang and
               Yi{-}Fan Zhang and
               Li Erran Li and
               Eric P. Xing},
  title     = {The Impact of Symbolic Representations on In-context Learning for Few-shot Reasoning},
  journal   = {CoRR},
  volume    = {abs/2212.08686},
  year      = {2022},
  doi       = {10.48550/arXiv.2212.08686},
  url       = {https://doi.org/10.48550/arXiv.2212.08686},
  eprinttype = {arXiv},
  eprint    = {2212.08686},
  timestamp = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-08686.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Symbolic Reasoning, In-Context Learning}
}

@article{DBLP:journals/corr/abs-2212-10403,
  author    = {Jie Huang and
               Kevin Chen{-}Chuan Chang},
  title     = {Towards Reasoning in Large Language Models: {A} Survey},
  journal   = {CoRR},
  volume    = {abs/2212.10403},
  year      = {2022},
  doi       = {10.48550/arXiv.2212.10403},
  url       = {https://doi.org/10.48550/arXiv.2212.10403},
  eprinttype = {arXiv},
  eprint    = {2212.10403},
  timestamp = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-10403.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Reasoning, Survey}
}

@inproceedings{DBLP:conf/emnlp/ChenLQLLCL22,
  author    = {Jiaqi Chen and
               Tong Li and
               Jinghui Qin and
               Pan Lu and
               Liang Lin and
               Chongyu Chen and
               Xiaodan Liang},
  title     = {UniGeo: Unifying Geometry Logical Reasoning via Reformulating Mathematical Expression},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {3313--3323},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.218},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ChenLQLLCL22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Symbolic Reasoning}
}

@article{DBLP:journals:corr:abs-2205-10625,
  author    = {Denny Zhou and
               Nathanael Sch{\"{a}}rli and
               Le Hou and
               Jason Wei and
               Nathan Scales and
               Xuezhi Wang and
               Dale Schuurmans and
               Olivier Bousquet and
               Quoc Le and
               Ed H. Chi},
  title     = {Least-to-Most Prompting Enables Complex Reasoning in Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2205.10625},
  year      = {2022},
  doi       = {10.48550/arXiv.2205.10625},
  url       = {https://doi.org/10.48550/arXiv.2205.10625},
  eprinttype = {arXiv},
  eprint    = {2205.10625},
  timestamp = {Wed, 01 Jun 2022 14:15:16 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2205-10625.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Reasoning, Prompt Engineering}
}
@String(DBLP:journals:corr:abs-2205-10625="(1) 两阶段的prompt，第一阶段问题分解（通过in-context learning实现，context中包含了其他问题的分解示例），对于每个问题，分解出回答该问题需要先回答什么子问题；
(2) 在第二阶段中，从后往前依次解决子问题，同样通过in-context learning得到，每次LLM的回答会参与组成下一个问题的prompt。")

// 0218

@article{DBLP:journals/corr/abs-2207-00747,
  author    = {Xuezhi Wang and
               Jason Wei and
               Dale Schuurmans and
               Quoc V. Le and
               Ed H. Chi and
               Denny Zhou},
  title     = {Rationale-Augmented Ensembles in Language Models},
  journal   = {CoRR},
  volume    = {abs/2207.00747},
  year      = {2022},
  doi       = {10.48550/arXiv.2207.00747},
  url       = {https://doi.org/10.48550/arXiv.2207.00747},
  eprinttype = {arXiv},
  eprint    = {2207.00747},
  timestamp = {Wed, 06 Jul 2022 15:50:43 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2207-00747.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Multi-Step Reasoning}
}

@inproceedings{DBLP:conf/coling/YangS22,
  author    = {Hsiu{-}Yu Yang and
               Carina Silberer},
  title     = {Are Visual-Linguistic Models Commonsense Knowledge Bases?},
  editor    = {Nicoletta Calzolari and
               Chu{-}Ren Huang and
               Hansaem Kim and
               James Pustejovsky and
               Leo Wanner and
               Key{-}Sun Choi and
               Pum{-}Mo Ryu and
               Hsin{-}Hsi Chen and
               Lucia Donatelli and
               Heng Ji and
               Sadao Kurohashi and
               Patrizia Paggio and
               Nianwen Xue and
               Seokhwan Kim and
               Younggyun Hahm and
               Zhong He and
               Tony Kyungil Lee and
               Enrico Santus and
               Francis Bond and
               Seung{-}Hoon Na},
  booktitle = {COLING},
  pages     = {5542--5559},
  publisher = {International Committee on Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.coling-1.491},
  timestamp = {Thu, 13 Oct 2022 17:29:38 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/YangS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation, Multimodal}
}

@inproceedings{DBLP:conf:acl-deelio:LiuSZDCC22,
  author    = {Jiachang Liu and
               Dinghan Shen and
               Yizhe Zhang and
               Bill Dolan and
               Lawrence Carin and
               Weizhu Chen},
  title     = {What Makes Good In-Context Examples for GPT-3?},
  editor    = {Eneko Agirre and
               Marianna Apidianaki and
               Ivan Vulic},
  booktitle = {ACL},
  pages     = {100--114},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  doi       = {10.18653/v1/2022.deelio-1.10},
  url       = {https://doi.org/10.18653/v1/2022.deelio-1.10},
  timestamp = {Mon, 01 Aug 2022 16:28:08 +0200},
  biburl    = {https://dblp.org/rec/conf/acl-deelio/LiuSZDCC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning},
  code      = {https://github.com/jiachangliu/KATEGPT3},
  plm       = {RoBERTa, T5, SBERT, GPT-3}
}
@String(DBLP:conf:acl-deelio:LiuSZDCC22="(1) 探索了在in-context learning中什么样的demonstration example可以对GPT-3的效果取得帮助；
(2) 利用roberta对样本进行编码，并计算demonstration与test example的向量距离（欧氏距离），最终发现与test example越相近的demonstration越能取得较好的效果。")

@inproceedings{DBLP:conf/icse/CiborowskaD22,
  author    = {Agnieszka Ciborowska and
               Kostadin Damevski},
  title     = {Fast Changeset-based Bug Localization with {BERT}},
  booktitle = {ICSE},
  pages     = {946--957},
  publisher = {{ACM}},
  year      = {2022},
  doi       = {10.1145/3510003.3510042},
  url       = {https://doi.org/10.1145/3510003.3510042},
  timestamp = {Mon, 18 Jul 2022 16:47:42 +0200},
  biburl    = {https://dblp.org/rec/conf/icse/CiborowskaD22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Code Fixing}
}

@inproceedings{zelikman2022star,
  author    = {Zelikman, Eric and Mu, Jesse and Goodman, Noah D and Wu, Yuhuai Tony},
  title     = {{STaR}: Self-taught reasoner bootstrapping reasoning with reasoning},
  booktitle = {NeurIPS},
  year      = {2022},
  url       = {https://research.google/pubs/pub51694/},
  keywords  = {Chain of Thought}
}

@inproceedings{DBLP:conf/acl/YaoHWDW21,
  author    = {Yunzhi Yao and
               Shaohan Huang and
               Wenhui Wang and
               Li Dong and
               Furu Wei},
  title     = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained Language Models for Domains},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  booktitle = {ACL Findings},
  series    = {Findings of {ACL}},
  volume    = {{ACL/IJCNLP} 2021},
  pages     = {460--470},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.findings-acl.40},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.40},
  timestamp = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/YaoHWDW21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation}
}

@inproceedings{DBLP:conf/acl/DiaoXSJSZ20,
  author    = {Shizhe Diao and
               Ruijia Xu and
               Hongjin Su and
               Yilei Jiang and
               Yan Song and
               Tong Zhang},
  title     = {Taming Pre-trained Language Models with N-gram Representations for Low-Resource Domain Adaptation},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  booktitle = {ACL},
  pages     = {3336--3349},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.acl-long.259},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.259},
  timestamp = {Wed, 08 Feb 2023 17:00:36 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/DiaoXSJSZ20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation}
}

@inproceedings{DBLP:conf/bionlp/YuanLTHH21,
  author    = {Zheng Yuan and
               Yijia Liu and
               Chuanqi Tan and
               Songfang Huang and
               Fei Huang},
  title     = {Improving Biomedical Pretrained Language Models with Knowledge},
  editor    = {Dina Demner{-}Fushman and
               Kevin Bretonnel Cohen and
               Sophia Ananiadou and
               Junichi Tsujii},
  booktitle = {NAACL},
  pages     = {180--190},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  doi       = {10.18653/v1/2021.bionlp-1.20},
  url       = {https://doi.org/10.18653/v1/2021.bionlp-1.20},
  timestamp = {Fri, 06 Aug 2021 00:41:22 +0200},
  biburl    = {https://dblp.org/rec/conf/bionlp/YuanLTHH21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Enhanced}
}

@inproceedings{DBLP:conf/coling/LiuJL22,
  author    = {Kesong Liu and
               Jianhui Jiang and
               Feifei Lyu},
  title     = {A Domain Knowledge Enhanced Pre-Trained Language Model for Vertical Search: Case Study on Medicinal Products},
  editor    = {Nicoletta Calzolari and
               Chu{-}Ren Huang and
               Hansaem Kim and
               James Pustejovsky and
               Leo Wanner and
               Key{-}Sun Choi and
               Pum{-}Mo Ryu and
               Hsin{-}Hsi Chen and
               Lucia Donatelli and
               Heng Ji and
               Sadao Kurohashi and
               Patrizia Paggio and
               Nianwen Xue and
               Seokhwan Kim and
               Younggyun Hahm and
               Zhong He and
               Tony Kyungil Lee and
               Enrico Santus and
               Francis Bond and
               Seung{-}Hoon Na},
  booktitle = {COLING},
  pages     = {1014--1023},
  publisher = {International Committee on Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.coling-1.85},
  timestamp = {Thu, 13 Oct 2022 17:29:38 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/LiuJL22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Enhanced, Domain Adaptive}
}

@inproceedings{DBLP:conf/emnlp/WangHQSWLG22,
  author    = {Jianing Wang and
               Wenkang Huang and
               Minghui Qiu and
               Qiuhui Shi and
               Hongbin Wang and
               Xiang Li and
               Ming Gao},
  title     = {Knowledge Prompting in Pre-trained Language Model for Natural Language Understanding},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {3164--3177},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.207},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/WangHQSWLG22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Enhanced, Natural Language Understanding}
}

@inproceedings{DBLP:conf/emnlp/AgrawalHLKS22,
  author    = {Monica Agrawal and
               Stefan Hegselmann and
               Hunter Lang and
               Yoon Kim and
               David A. Sontag},
  title     = {Large language models are few-shot clinical information extractors},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  booktitle = {EMNLP},
  pages     = {1998--2022},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.130},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/AgrawalHLKS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Information Extraction}
}

@inproceedings{DBLP:conf/emnlp/ChengHLZ0WDZ22,
  author     = {Daixuan Cheng and
                Shaohan Huang and
                Jianfeng Liu and
                Yuefeng Zhan and
                Hao Sun and
                Furu Wei and
                Denvy Deng and
                Qi Zhang},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Snapshot-Guided Domain Adaptation for {ELECTRA}},
  booktitle  = {EMNLP Findings},
  pages      = {2226--2232},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.163},
  keywords   = {Domain Adaptive},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChengHLZ0WDZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/GutierrezMWCLS022,
  author     = {Bernal Jimenez Gutierrez and
                Nikolas McNeal and
                Clayton Washington and
                You Chen and
                Lang Li and
                Huan Sun and
                Yu Su},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Thinking about {GPT-3} In-Context Learning for Biomedical IE? Think
                Again},
  booktitle  = {EMNLP Findings},
  pages      = {4497--4512},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.329},
  keywords   = {Information Extraction, In-Context Learning},
  timestamp  = {Tue, 07 Feb 2023 17:10:52 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/GutierrezMWCLS022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/0001HDZJMS22,
  author     = {Dou Hu and
                Xiaolong Hou and
                Xiyang Du and
                Mengyuan Zhou and
                Lianxin Jiang and
                Yang Mo and
                Xiaofeng Shi},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {VarMAE: Pre-training of Variational Masked Autoencoder for Domain-adaptive
                Language Understanding},
  booktitle  = {EMNLP Findings},
  pages      = {6276--6286},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.468},
  keywords   = {Natural Language Understanding, Domain Adaptive},
  timestamp  = {Tue, 07 Feb 2023 17:10:52 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/0001HDZJMS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2210-01240,
  author     = {Abulhair Saparov and
                He He},
  title      = {Language Models Are Greedy Reasoners: {A} Systematic Formal Analysis
                of Chain-of-Thought},
  journal    = {CoRR},
  volume     = {abs/2210.01240},
  year       = {2022},
  doi        = {10.48550/arXiv.2210.01240},
  url        = {https://doi.org/10.48550/arXiv.2210.01240},
  eprinttype = {arXiv},
  eprint     = {2210.01240},
  keywords   = {Chain of Thought},
  timestamp  = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-01240.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/chi/ReynoldsM21,
  author     = {Laria Reynolds and
                Kyle McDonell},
  editor     = {Yoshifumi Kitamura and
                Aaron Quigley and
                Katherine Isbister and
                Takeo Igarashi},
  title      = {Prompt Programming for Large Language Models: Beyond the Few-Shot
                Paradigm},
  booktitle  = {CHI},
  pages      = {314:1--314:7},
  publisher  = {{ACM}},
  year       = {2021},
  doi        = {10.1145/3411763.3451760},
  url        = {https://doi.org/10.1145/3411763.3451760},
  keywords   = {Prompt Engineering},
  timestamp  = {Wed, 19 May 2021 12:29:49 +0200},
  biburl     = {https://dblp.org/rec/conf/chi/ReynoldsM21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/evoW/KrolLM22,
  author     = {Stephen James Krol and
                Maria Teresa Llano and
                Jon McCormack},
  editor     = {Tiago Martins and
                Nereida Rodr{\'{\i}}guez{-}Fern{\'{a}}ndez and
                S{\'{e}}rgio M. Rebelo},
  title      = {Towards the Generation of Musical Explanations with {GPT-3}},
  booktitle  = {EvoMUSART},
  series     = {Lecture Notes in Computer Science},
  volume     = {13221},
  pages      = {131--147},
  publisher  = {Springer},
  year       = {2022},
  doi        = {10.1007/978-3-031-03789-4\_9},
  url        = {https://doi.org/10.1007/978-3-031-03789-4\_9},
  keywords   = {Application},
  timestamp  = {Fri, 22 Apr 2022 19:18:40 +0200},
  biburl     = {https://dblp.org/rec/conf/evoW/KrolLM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-05442,
  author     = {Mostafa Dehghani and
                Josip Djolonga and
                Basil Mustafa and
                Piotr Padlewski and
                Jonathan Heek and
                Justin Gilmer and
                Andreas Steiner and
                Mathilde Caron and
                Robert Geirhos and
                Ibrahim Alabdulmohsin and
                Rodolphe Jenatton and
                Lucas Beyer and
                Michael Tschannen and
                Anurag Arnab and
                Xiao Wang and
                Carlos Riquelme and
                Matthias Minderer and
                Joan Puigcerver and
                Utku Evci and
                Manoj Kumar and
                Sjoerd van Steenkiste and
                Gamaleldin F. Elsayed and
                Aravindh Mahendran and
                Fisher Yu and
                Avital Oliver and
                Fantine Huot and
                Jasmijn Bastings and
                Mark Patrick Collier and
                Alexey A. Gritsenko and
                Vighnesh Birodkar and
                Cristina Vasconcelos and
                Yi Tay and
                Thomas Mensink and
                Alexander Kolesnikov and
                Filip Pavetic and
                Dustin Tran and
                Thomas Kipf and
                Mario Lucic and
                Xiaohua Zhai and
                Daniel Keysers and
                Jeremiah Harmsen and
                Neil Houlsby},
  title      = {Scaling Vision Transformers to 22 Billion Parameters},
  journal    = {CoRR},
  volume     = {abs/2302.05442},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.05442},
  url        = {https://doi.org/10.48550/arXiv.2302.05442},
  eprinttype = {arXiv},
  eprint     = {2302.05442},
  keywords   = {Multimodal},
  timestamp  = {Mon, 13 Feb 2023 14:23:40 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-05442.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2207-07411,
  author     = {Dustin Tran and
                Jeremiah Z. Liu and
                Michael W. Dusenberry and
                Du Phan and
                Mark Collier and
                Jie Ren and
                Kehang Han and
                Zi Wang and
                Zelda Mariet and
                Huiyi Hu and
                Neil Band and
                Tim G. J. Rudner and
                Karan Singhal and
                Zachary Nado and
                Joost van Amersfoort and
                Andreas Kirsch and
                Rodolphe Jenatton and
                Nithum Thain and
                Honglin Yuan and
                Kelly Buchanan and
                Kevin Murphy and
                D. Sculley and
                Yarin Gal and
                Zoubin Ghahramani and
                Jasper Snoek and
                Balaji Lakshminarayanan},
  title      = {Plex: Towards Reliability using Pretrained Large Model Extensions},
  journal    = {CoRR},
  volume     = {abs/2207.07411},
  year       = {2022},
  doi        = {10.48550/arXiv.2207.07411},
  url        = {https://doi.org/10.48550/arXiv.2207.07411},
  eprinttype = {arXiv},
  eprint     = {2207.07411},
  keywords   = {Reliability},
  timestamp  = {Thu, 05 Jan 2023 22:22:55 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-07411.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/iclr/WenJMDSLT21,
  author    = {Yeming Wen and
               Ghassen Jerfel and
               Rafael Muller and
               Michael W. Dusenberry and
               Jasper Snoek and
               Balaji Lakshminarayanan and
               Dustin Tran},
  title     = {Combining Ensembles and Data Augmentation Can Harm Your Calibration},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2021},
  url       = {https://openreview.net/forum?id=g11CZSghXyY},
  timestamp = {Wed, 23 Jun 2021 17:36:40 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/WenJMDSLT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Data Augmentation}
}

@inproceedings{DBLP:conf/nips/MindererDRHZHTL21,
  author     = {Matthias Minderer and
                Josip Djolonga and
                Rob Romijnders and
                Frances Hubis and
                Xiaohua Zhai and
                Neil Houlsby and
                Dustin Tran and
                Mario Lucic},
  editor     = {Marc'Aurelio Ranzato and
                Alina Beygelzimer and
                Yann N. Dauphin and
                Percy Liang and
                Jennifer Wortman Vaughan},
  title      = {Revisiting the Calibration of Modern Neural Networks},
  booktitle  = {NeurIPS},
  pages      = {15682--15694},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/8420d359404024567b5aefda1231af24-Abstract.html},
  keywords   = {Reliability},
  timestamp  = {Tue, 03 May 2022 16:20:48 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/MindererDRHZHTL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/nips/KarandikarCTLSM21,
  author     = {Archit Karandikar and
                Nicholas Cain and
                Dustin Tran and
                Balaji Lakshminarayanan and
                Jonathon Shlens and
                Michael C. Mozer and
                Becca Roelofs},
  editor     = {Marc'Aurelio Ranzato and
                Alina Beygelzimer and
                Yann N. Dauphin and
                Percy Liang and
                Jennifer Wortman Vaughan},
  title      = {Soft Calibration Objectives for Neural Networks},
  booktitle  = {NeurIPS},
  pages      = {29768--29779},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/f8905bd3df64ace64a68e154ba72f24c-Abstract.html},
  keywords   = {Reliability},
  timestamp  = {Tue, 03 May 2022 16:20:49 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/KarandikarCTLSM21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{ye2022unreliability,
  title={The unreliability of explanations in few-shot prompting for textual reasoning},
  author={Ye, Xi and Durrett, Greg},
  booktitle={NeurIPS},
  year={2022},
  url={https://par.nsf.gov/biblio/10380030},
  keywords={Prompt Engineering, Reasoning}
}

@inproceedings{DBLP:conf/iclr/PoesiaP00SMG22,
  author    = {Gabriel Poesia and
               Alex Polozov and
               Vu Le and
               Ashish Tiwari and
               Gustavo Soares and
               Christopher Meek and
               Sumit Gulwani},
  title     = {Synchromesh: Reliable Code Generation from Pre-trained Language Models},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=KmtVD97J43e},
  timestamp = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/PoesiaP00SMG22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Program and Code Generation, Reliability}
}

@inproceedings{DBLP:conf/emnlp/WangLXZZ21,
  author     = {Shuohang Wang and
                Yang Liu and
                Yichong Xu and
                Chenguang Zhu and
                Michael Zeng},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {Want To Reduce Labeling Cost? {GPT-3} Can Help},
  booktitle  = {EMNLP Findings},
  pages      = {4195--4205},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.findings-emnlp.354},
  url        = {https://doi.org/10.18653/v1/2021.findings-emnlp.354},
  keywords   = {Data Annotation},
  timestamp  = {Fri, 13 May 2022 11:42:33 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/WangLXZZ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2212-10450,
  author     = {Bosheng Ding and
                Chengwei Qin and
                Linlin Liu and
                Lidong Bing and
                Shafiq R. Joty and
                Boyang Li},
  title      = {Is {GPT-3} a Good Data Annotator?},
  journal    = {CoRR},
  volume     = {abs/2212.10450},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.10450},
  url        = {https://doi.org/10.48550/arXiv.2212.10450},
  eprinttype = {arXiv},
  eprint     = {2212.10450},
  keywords   = {Data Annotation},
  timestamp  = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10450.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2212-10529,
  author     = {Xingxuan Li and
                Yutong Li and
                Linlin Liu and
                Lidong Bing and
                Shafiq R. Joty},
  title      = {Is {GPT-3} a Psychopath? Evaluating Large Language Models from a Psychological
                Perspective},
  journal    = {CoRR},
  volume     = {abs/2212.10529},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.10529},
  url        = {https://doi.org/10.48550/arXiv.2212.10529},
  eprinttype = {arXiv},
  eprint     = {2212.10529},
  keywords   = {Evaluation},
  timestamp  = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10529.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-02094,
  author     = {Paula Maddigan and
                Teo Susnjak},
  title      = {Chat2VIS: Generating Data Visualisations via Natural Language using
                ChatGPT, Codex and {GPT-3} Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2302.02094},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.02094},
  url        = {https://doi.org/10.48550/arXiv.2302.02094},
  eprinttype = {arXiv},
  eprint     = {2302.02094},
  keywords   = {Data Visualisation},
  timestamp  = {Fri, 10 Feb 2023 12:26:39 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-02094.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/acl/LiuLHC022,
  author    = {Fangchao Liu and
               Hongyu Lin and
               Xianpei Han and
               Boxi Cao and
               Le Sun},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Pre-training to Match for Unified Low-shot Relation Extraction},
  booktitle = {ACL},
  pages     = {5785--5795},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.397},
  doi       = {10.18653/v1/2022.acl-long.397},
  timestamp = {Mon, 01 Aug 2022 16:27:47 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/LiuLHC022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Relation Extraction}
}

@inproceedings{DBLP:conf/acl/JieLL22,
  author    = {Zhanming Jie and
               Jierui Li and
               Wei Lu},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Learning to Reason Deductively: Math Word Problem Solving as Complex
               Relation Extraction},
  booktitle = {ACL},
  pages     = {5944--5955},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.410},
  doi       = {10.18653/v1/2022.acl-long.410},
  timestamp = {Mon, 01 Aug 2022 16:27:49 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/JieLL22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Relation Extraction}
}

@inproceedings{DBLP:conf/acl/PapalucaKSL22,
  author    = {Andrea Papaluca and
               Daniel Krefl and
               Hanna Suominen and
               Artem Lenskiy},
  editor    = {Samuel Louvan and
               Andrea Madotto and
               Brielen Madureira},
  title     = {Pretrained Knowledge Base Embeddings for improved Sentential Relation
               Extraction},
  booktitle = {ACL},
  pages     = {373--382},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-srw.29},
  doi       = {10.18653/v1/2022.acl-srw.29},
  timestamp = {Mon, 01 Aug 2022 16:27:52 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/PapalucaKSL22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Relation Extraction}
}

@inproceedings{DBLP:conf/bionlp/GiorgiBW22,
  author    = {John M. Giorgi and
               Gary D. Bader and
               Bo Wang},
  editor    = {Dina Demner{-}Fushman and
               Kevin Bretonnel Cohen and
               Sophia Ananiadou and
               Junichi Tsujii},
  title     = {A sequence-to-sequence approach for document-level relation extraction},
  booktitle = {ACL},
  pages     = {10--25},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.bionlp-1.2},
  doi       = {10.18653/v1/2022.bionlp-1.2},
  timestamp = {Mon, 01 Aug 2022 16:27:55 +0200},
  biburl    = {https://dblp.org/rec/conf/bionlp/GiorgiBW22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Relation Extraction}
}

@inproceedings{DBLP:conf/bionlp/IinumaMS22,
  author     = {Naoki Iinuma and
                Makoto Miwa and
                Yutaka Sasaki},
  editor     = {Dina Demner{-}Fushman and
                Kevin Bretonnel Cohen and
                Sophia Ananiadou and
                Junichi Tsujii},
  title      = {Improving Supervised Drug-Protein Relation Extraction with Distantly
                Supervised Models},
  booktitle  = {ACL},
  pages      = {161--170},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.bionlp-1.16},
  url        = {https://doi.org/10.18653/v1/2022.bionlp-1.16},
  keywords   = {Relation Extraction},
  timestamp  = {Mon, 01 Aug 2022 16:27:54 +0200},
  biburl     = {https://dblp.org/rec/conf/bionlp/IinumaMS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/bionlp/SarroutiTR22,
  author     = {Mourad Sarrouti and
                Carson Tao and
                Yoann Mamy Randriamihaja},
  editor     = {Dina Demner{-}Fushman and
                Kevin Bretonnel Cohen and
                Sophia Ananiadou and
                Junichi Tsujii},
  title      = {Comparing Encoder-Only and Encoder-Decoder Transformers for Relation
                Extraction from Biomedical Texts: An Empirical Study on Ten Benchmark
                Datasets},
  booktitle  = {ACL},
  pages      = {376--382},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.bionlp-1.37},
  url        = {https://doi.org/10.18653/v1/2022.bionlp-1.37},
  keywords   = {Relation Extraction},
  timestamp  = {Mon, 01 Aug 2022 16:27:54 +0200},
  biburl     = {https://dblp.org/rec/conf/bionlp/SarroutiTR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals:corr:abs-2212-10559,
  author     = {Damai Dai and
                Yutao Sun and
                Li Dong and
                Yaru Hao and
                Zhifang Sui and
                Furu Wei},
  title      = {Why Can {GPT} Learn In-Context? Language Models Secretly Perform Gradient
                Descent as Meta-Optimizers},
  journal    = {CoRR},
  volume     = {abs/2212.10559},
  year       = {2022},
  doi        = {10.48550/arXiv.2212.10559},
  url        = {https://doi.org/10.48550/arXiv.2212.10559},
  eprinttype = {arXiv},
  eprint     = {2212.10559},
  keywords   = {In-Context Learning},
  timestamp  = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10559.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@String(DBLP:journals:corr:abs-2212-10559="(1) 与The Dual Form of Neural Networks Revisited结合一起看，可以进一步理解in-context learning，通过与NN线性层对偶形式的类比，可以将ICL流程描述为：1. 基于Transformer的预训练语言模型作为元优化器；2. 通过正向计算，根据示范例子产生元梯度；3. 通过关注，将元梯度应用于原始语言模型，建立一个ICL模型；
(2)与Fine-tune类似，ICL也是在zero-shot learning参数的基础上，提供了一个更新量。")

@article{DBLP:journals/corr/abs-2302-07459,
  author     = {Deep Ganguli and
                Amanda Askell and
                Nicholas Schiefer and
                Thomas I. Liao and
                Kamile Lukosiute and
                Anna Chen and
                Anna Goldie and
                Azalia Mirhoseini and
                Catherine Olsson and
                Danny Hernandez and
                Dawn Drain and
                Dustin Li and
                Eli Tran{-}Johnson and
                Ethan Perez and
                Jackson Kernion and
                Jamie Kerr and
                Jared Mueller and
                Joshua Landau and
                Kamal Ndousse and
                Karina Nguyen and
                Liane Lovitt and
                Michael Sellitto and
                Nelson Elhage and
                Noem{\'{\i}} Mercado and
                Nova DasSarma and
                Oliver Rausch and
                Robert Lasenby and
                Robin Larson and
                Sam Ringer and
                Sandipan Kundu and
                Saurav Kadavath and
                Scott Johnston and
                Shauna Kravec and
                Sheer El Showk and
                Tamera Lanham and
                Timothy Telleen{-}Lawton and
                Tom Henighan and
                Tristan Hume and
                Yuntao Bai and
                Zac Hatfield{-}Dodds and
                Ben Mann and
                Dario Amodei and
                Nicholas Joseph and
                Sam McCandlish and
                Tom Brown and
                Christopher Olah and
                Jack Clark and
                Samuel R. Bowman and
                Jared Kaplan},
  title      = {The Capacity for Moral Self-Correction in Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2302.07459},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.07459},
  url        = {https://doi.org/10.48550/arXiv.2302.07459},
  eprinttype = {arXiv},
  eprint     = {2302.07459},
  keywords   = {Instruction Tuning, RLHF},
  timestamp  = {Thu, 23 Feb 2023 10:18:51 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-07459.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-10205,
  author     = {Xiang Wei and
                Xingyu Cui and
                Ning Cheng and
                Xiaobin Wang and
                Xin Zhang and
                Shen Huang and
                Pengjun Xie and
                Jinan Xu and
                Yufeng Chen and
                Meishan Zhang and
                Yong Jiang and
                Wenjuan Han},
  title      = {Zero-Shot Information Extraction via Chatting with ChatGPT},
  journal    = {CoRR},
  volume     = {abs/2302.10205},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.10205},
  url        = {https://doi.org/10.48550/arXiv.2302.10205},
  eprinttype = {arXiv},
  eprint     = {2302.10205},
  keywords   = {Information Extraction},
  timestamp  = {Thu, 23 Feb 2023 16:02:44 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-10205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-09419,
  author     = {Ce Zhou and
                Qian Li and
                Chen Li and
                Jun Yu and
                Yixin Liu and
                Guangjing Wang and
                Kai Zhang and
                Cheng Ji and
                Qiben Yan and
                Lifang He and
                Hao Peng and
                Jianxin Li and
                Jia Wu and
                Ziwei Liu and
                Pengtao Xie and
                Caiming Xiong and
                Jian Pei and
                Philip S. Yu and
                Lichao Sun},
  title      = {A Comprehensive Survey on Pretrained Foundation Models: {A} History
                from {BERT} to ChatGPT},
  journal    = {CoRR},
  volume     = {abs/2302.09419},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.09419},
  url        = {https://doi.org/10.48550/arXiv.2302.09419},
  eprinttype = {arXiv},
  eprint     = {2302.09419},
  keywords   = {Survey},
  timestamp  = {Thu, 23 Feb 2023 16:02:44 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-09419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-06466,
  author     = {Reham Omar and
                Omij Mangukiya and
                Panos Kalnis and
                Essam Mansour},
  title      = {ChatGPT versus Traditional Question Answering for Knowledge Graphs:
                Current Status and Future Directions Towards Knowledge Graph Chatbots},
  journal    = {CoRR},
  volume     = {abs/2302.06466},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.06466},
  url        = {https://doi.org/10.48550/arXiv.2302.06466},
  eprinttype = {arXiv},
  eprint     = {2302.06466},
  keywords   = {Question Answering, Evaluation},
  timestamp  = {Mon, 20 Feb 2023 14:27:28 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-06466.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{kung2023performance,
  title={Performance of {ChatGPT} on {USMLE}: Potential for {AI}-assisted medical education using large language models},
  author={Kung, Tiffany H and Cheatham, Morgan and Medenilla, Arielle and Sillos, Czarina and De Leon, Lorie and Elepa{\~n}o, Camille and Madriaga, Maria and Aggabao, Rimel and Diaz-Candido, Giezel and Maningo, James and others},
  journal={PLOS Digital Health},
  volume={2},
  number={2},
  pages={e0000198},
  year={2023},
  publisher={Public Library of Science},
  doi={10.1371/journal.pdig.0000198},
  url={https://journals.plos.org/digitalhealth/article?id=10.1371/journal.pdig.0000198},
  keywords={Application}
}

@article{mbakwe2023chatgpt,
  title={{ChatGPT} passing {USMLE} shines a spotlight on the flaws of medical education},
  author={Mbakwe, Amarachi B and Lourentzou, Ismini and Celi, Leo Anthony and Mechanic, Oren J and Dagan, Alon},
  journal={PLOS Digital Health},
  volume={2},
  number={2},
  pages={e0000205},
  year={2023},
  publisher={Public Library of Science},
  address={San Francisco, CA, USA},
  doi={10.1371/journal.pdig.0000205},
  keywords={Application},
  url={https://journals.plos.org/digitalhealth/article?id=10.1371/journal.pdig.0000205}
}

@inproceedings{DBLP:conf/iclr/ClarkLLM20,
  author     = {Kevin Clark and
                Minh{-}Thang Luong and
                Quoc V. Le and
                Christopher D. Manning},
  title      = {{ELECTRA:} Pre-training Text Encoders as Discriminators Rather Than
                Generators},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=r1xMH1BtvB},
  keywords   = {Pre-Training Techniques},
  plm        = {ELECTRA},
  timestamp  = {Thu, 07 May 2020 17:11:48 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ClarkLLM20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/naacl/DevlinCLT19,
  author    = {Jacob Devlin and
               Ming{-}Wei Chang and
               Kenton Lee and
               Kristina Toutanova},
  editor    = {Jill Burstein and
               Christy Doran and
               Thamar Solorio},
  title     = {{BERT:} Pre-training of Deep Bidirectional Transformers for Language
               Understanding},
  booktitle = {NAACL},
  pages     = {4171--4186},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/n19-1423},
  doi       = {10.18653/v1/n19-1423},
  timestamp = {Mon, 26 Sep 2022 12:21:55 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/DevlinCLT19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  plm={BERT},
  keywords={Pre-Training Techniques}
}

@article{DBLP:journals/corr/abs-1907-11692,
  author     = {Yinhan Liu and
                Myle Ott and
                Naman Goyal and
                Jingfei Du and
                Mandar Joshi and
                Danqi Chen and
                Omer Levy and
                Mike Lewis and
                Luke Zettlemoyer and
                Veselin Stoyanov},
  title      = {RoBERTa: {A} Robustly Optimized {BERT} Pretraining Approach},
  journal    = {CoRR},
  volume     = {abs/1907.11692},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.11692},
  eprinttype = {arXiv},
  eprint     = {1907.11692},
  keywords   = {Pre-Training Techniques},
  plm        = {RoBERTa},
  timestamp  = {Thu, 01 Aug 2019 08:59:33 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-11692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/CuiC000H20,
  author     = {Yiming Cui and
                Wanxiang Che and
                Ting Liu and
                Bing Qin and
                Shijin Wang and
                Guoping Hu},
  editor     = {Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {Revisiting Pre-Trained Models for Chinese Natural Language Processing},
  booktitle  = {EMNLP Findings},
  series     = {ACL Findings},
  volume     = {{EMNLP} 2020},
  pages      = {657--668},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/v1/2020.findings-emnlp.58},
  url        = {https://doi.org/10.18653/v1/2020.findings-emnlp.58},
  keywords   = {Pre-Training Techniques},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/CuiC000H20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}


// from Wu Tongtong

@inproceedings{KeLMXS21,
  author    = {Zixuan Ke and
               Bing Liu and
               Nianzu Ma and
               Hu Xu and
               Lei Shu},
  title     = {Achieving Forgetting Prevention and Knowledge Transfer in Continual
               Learning},
  booktitle = {NeurIPS},
  pages     = {22443--22456},
  year      = {2021},
  url       = {https://proceedings.neurips.cc/paper/2021/hash/bcd0049c35799cdf57d06eaf2eb3cff6-Abstract.html},
  keywords={Continual Learning}
}
@String(KeLMXS21="NeurIPS 2021, The key component of CTR is the CL-plugin inserted in BERT. A CL-plugin is a capsule network with a new transfer routing mechanism to encourage knowledge transfer among tasks and also to isolate task-specific knowledge to avoid forgetting.")

@inproceedings{jin-etal-2021-learn-continually,
  author    = {Jin, Xisen and
               Lin, Bill Yuchen and
               Rostami, Mohammad and
               Ren, Xiang},
  title     = {Learn Continually, Generalize Rapidly: Lifelong Knowledge Accumulation for Few-shot Learning},
  booktitle = {EMNLP Findings},
  pages     = {714--729},
  year      = {2021},
  url       = {https://aclanthology.org/2021.findings-emnlp.62},
  keywords  = {Continual Learning}
}
@String(jin-etal-2021-learn-continually="We present a new learning setup, Continual Learning of Few-Shot Learners, to address challenges of both learning settings in a unified setup, with a hyper-network for task-specific adapter generation.")

@inproceedings{HeLCOLGP21,
  author    = {Tianxing He and
               Jun Liu and
               Kyunghyun Cho and
               Myle Ott and
               Bing Liu and
               James R. Glass and
               Fuchun Peng},
  title     = {Analyzing the Forgetting Problem in Pretrain-Finetuning of Open-domain
               Dialogue Response Models},
  booktitle = {Proceedings of EACL},
  pages     = {1121--1133},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.eacl-main.95},
  keywords  = {Continual Learning}
}
@String(HeLCOLGP21="Our major finding is that after standard finetuning, the model forgets some of the important language generation skills acquired during large-scale pretraining. We propose an intuitive finetuning strategy named “mix-review”: For each finetuning epoch, we mix the target dialogue data with a random subset of the pretraining data, mix_ratio is 4, decay is 0.9.")

@inproceedings{WangTDWHJCJZ21,
  author    = {Ruize Wang and
               Duyu Tang and
               Nan Duan and
               Zhongyu Wei and
               Xuanjing Huang and
               Jianshu Ji and
               Guihong Cao and
               Daxin Jiang and
               Ming Zhou},
  title     = {{K-Adapter}: Infusing Knowledge into Pre-Trained Models with Adapters},
  booktitle = {ACL Findings},
  pages     = {1405--1418},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.121},
  keywords  = {Continual Learning}
}
@String(WangTDWHJCJZ21="We propose K-Adapter, a framework that retains the original parameters of the pre-trained model fixed and supports the development of versatile knowledge-infused model.")

@inproceedings{ChenHCCLY20,
  author    = {Sanyuan Chen and
               Yutai Hou and
               Yiming Cui and
               Wanxiang Che and
               Ting Liu and
               Xiangzhan Yu},
  title     = {Recall and Learn: Fine-tuning Deep Pretrained Language Models with
               Less Forgetting},
  booktitle = {Proceedings of EMNLP},
  pages     = {7870--7881},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.634},
  keywords  = {Continual Learning}
}
@String(ChenHCCLY20="We propose a recall and learn mechanism, which adopts the idea of multi-task learning and jointly learns pretraining tasks and downstream tasks. Specifically, we introduce a Pretraining Simulation mechanism to recall the knowledge from pretraining tasks without data, and an Objective Shifting mechanism to focus the learning on downstream tasks gradually.")

@inproceedings{qin2022lfpt,
  author    = {Chengwei Qin and
               Shafiq Joty},
  title     = {{LFPT5}: A Unified Framework for Lifelong Few-shot Language Learning Based on Prompt Tuning of {T5}},
  booktitle = {Proceedings of ICLR},
  year      = {2022},
  url       = {https://openreview.net/forum?id=HCRVf71PMF},
  keywords  = {Continual Learning}
}
@String(qin2022lfpt="We define a challenging yet practical problem as Lifelong Few-shot Language Learning and propose a unified framework for it based on prompt tuning of T5.")

@inproceedings{jang2022towards,
  author    = {Joel Jang and
               Seonghyeon Ye and
               Sohee Yang and
               Joongbo Shin and
               Janghoon Han and
               Gyeonghun Kim and
               Stanley Jungkyu Choi and
               Minjoon Seo},
  title     = {Towards Continual Knowledge Learning of Language Models},
  booktitle = {Proceedings of ICLR},
  year      = {2022},
  url       = {https://openreview.net/forum?id=vfsRB5MImo9},
  keywords  = {Continual Learning}
}
@String(jang2022towards="We propose a novel continual learning formulation named Continual Knowledge Learning which allows large language models to constantly obtain new and updated knowledge while mitigating forgetting of previously learned time-invariant knowledge.")

@inproceedings{wu2022pretrained,
  author    = {Tongtong Wu and
               Massimo Caccia and
               Zhuang Li and
               Yuan-Fang Li and
               Guilin Qi and
               Gholamreza Haffari},
  title     = {Pretrained Language Model in Continual Learning: A Comparative Study},
  booktitle = {Proceedings of ICLR},
  year      = {2022},
  url       = {https://openreview.net/forum?id=figzpGMrdD},
  keywords  = {Continual Learning}
}
@String(wu2022pretrained="To explore the layer-wise property of pretrained language models in continual learning, we thoroughly compare the continual learning performance over the combination of 5 PLMs and 4 veins of CL methods on 3 benchmarks in 2 typical incremental settings.")

@inproceedings{liu-etal-2021-domain,
  author    = {Liu, Qingbin and
               Cao, Pengfei and
               Liu, Cao and
               Chen, Jiansong and
               Cai, Xunliang and
               Yang, Fan and
               He, Shizhu and
               Liu, Kang and
               Zhao, Jun},
  title     = {Domain-Lifelong Learning for Dialogue State Tracking via Knowledge Preservation Networks},
  booktitle = {Proceedings of EMNLP},
  pages     = {2301--2311},
  year      = {2021},
  url       = {https://aclanthology.org/2021.emnlp-main.176},
  keywords  = {Continual Learning}
}
@String(liu-etal-2021-domain="This paper explores Domain-Lifelong Learning for Dialogue State Tracking. We propose Knowledge Preservation Network, which consists of multi-prototype enhanced retrospection and multi-strategy knowledge distillation, to solve the problems of expression diversity and combinatorial explosion in the DLL-DST task.")

@inproceedings{ke-etal-2021-classic,
  author    = {Ke, Zixuan and
               Liu, Bing and
               Xu, Hu and
               Shu, Lei},
  title     = {{CLASSIC}: Continual and Contrastive Learning of Aspect Sentiment Classification Tasks},
  booktitle = {Proceedings of EMNLP},
  pages     = {6871--6883},
  year      = {2021},
  url       = {https://aclanthology.org/2021.emnlp-main.550},
  keywords  = {Continual Learning}
}
@String(ke-etal-2021-classic="The key novelty is a contrastive continual learning method that enables both knowledge transfer across tasks and knowledge distillation from old tasks to the new task, which eliminates the need for task ids in testing.")

@inproceedings{situ-etal-2021-lifelong,
  author    = {Situ, Xuelin and
               Maruf, Sameen and
               Zukerman, Ingrid and
               Paris, Cecile and
               Haffari, Gholamreza},
  title     = {Lifelong Explainer for Lifelong Learners},
  booktitle = {Proceedings of EMNLP},
  pages     = {2933--2940},
  year      = {2021},
  url       = {https://aclanthology.org/2021.emnlp-main.233},
  keywords  = {Continual Learning}
}
@String(situ-etal-2021-lifelong="We propose a novel Lifelong Explanation approach that continuously trains a student explainer under the supervision of a teacher – an arbitrary explanation algorithm – on different tasks undertaken in LL. We also leverage the Experience Replay mechanism to prevent catastrophic forgetting in the student explainer.")

@inproceedings{ZhaoNLJCM21,
  author    = {Yingzhu Zhao and
               Chongjia Ni and
               Cheung{-}Chi Leung and
               Shafiq R. Joty and
               Eng Siong Chng and
               Bin Ma},
  title     = {A Unified Speaker Adaptation Approach for {ASR}},
  booktitle = {Proceedings of EMNLP},
  pages     = {9339--9349},
  year      = {2021},
  url       = {https://aclanthology.org/2021.emnlp-main.737},
  keywords  = {Continual Learning}
}
@String(ZhaoNLJCM21="Prefix-based user identifier, Continual ASR / Architecture Search / Network Pruning.")

@inproceedings{3447548.3467162,
  author    = {Amba Hombaiah, Spurthi and
               Chen, Tao and
               Zhang, Mingyang and
               Bendersky, Michael and
               Najork, Marc},
  title     = {Dynamic Language Models for Continuously Evolving Content},
  booktitle = {Proceedings of SIGKDD},
  pages     = {2514--2524},
  year      = {2021},
  url       = {https://doi.org/10.1145/3447548.3467162},
  keywords  = {Continual Learning}
}
@String(3447548.3467162="We propose a simple yet effective algorithm to tackle the problem of OOV new tokens and sub-optimal tokenization. Finally, we propose three effective sampling methods to detect the training examples which contain updated knowledge and use these examples to enable efficient incremental training.")

@inproceedings{guo-etal-2021-parameter,
  author    = {Guo, Demi and
               Rush, Alexander and
               Kim, Yoon},
  title     = {Parameter-Efficient Transfer Learning with Diff Pruning},
  booktitle = {Proceedings of ACL},
  pages     = {4884--4896},
  year      = {2021},
  url       = {https://aclanthology.org/2021.acl-long.378},
  keywords  = {Continual Learning}
}
@String(guo-etal-2021-parameter="The approach learns a task-specific “diff” vector that extends the original pretrained parameters. As the number of tasks increases, diff pruning remains parameter-efficient, as it requires storing only a small diff vector for each task.")

@inproceedings{cui-etal-2021-refining,
  author    = {Cui, Li and
               Yang, Deqing and
               Yu, Jiaxin and
               Hu, Chengwei and
               Cheng, Jiayang and
               Yi, Jingjie and
               Xiao, Yanghua},
  title     = {Refining Sample Embeddings with Relation Prototypes to Enhance Continual Relation Extraction},
  booktitle = {Proceedings of ACL},
  pages     = {232--243},
  year      = {2021},
  url       = {https://aclanthology.org/2021.acl-long.20},
  keywords  = {Continual Learning}
}
@String(cui-etal-2021-refining="To fully utilize memorized samples, in this paper, we employ relation prototype to extract useful information of each relation. ")


@inproceedings{he-etal-2021-effectiveness,
  author    = {He, Ruidan and
               Liu, Linlin and
               Ye, Hai and
               Tan, Qingyu and
               Ding, Bosheng and
               Cheng, Liying and
               Low, Jiawei and
               Bing, Lidong and
               Si, Luo},
  title     = {On the Effectiveness of Adapter-based Tuning for Pretrained Language Model Adaptation},
  booktitle = {Proceedings of ACL},
  pages     = {2208--2222},
  year      = {2021},
  url       = {https://aclanthology.org/2021.acl-long.172},
  keywords  = {Continual Learning}
}
@String(he-etal-2021-effectiveness="We first show that adapter-based tuning better mitigates forgetting issues than fine-tuning since it yields representations with less deviation from those generated by the initial PrLM. Effectiveness: (1) it tends to outperform fine-tuning on both low-resource and cross-lingual tasks; (2) it demonstrates higher stability under different learning rates compared to fine-tuning.")

@inproceedings{kanwatchara-etal-2021-rational,
  author    = {Kanwatchara, Kasidis and
               Horsuwan, Thanapapas and
               Lertvittayakumjorn, Piyawat and
               Kijsirikul, Boonserm and
               Vateekul, Peerapon},
  title     = {Rational {LAMOL}: A Rationale-based Lifelong Learning Framework},
  booktitle = {Proceedings of ACL},
  pages     = {2942--2953},
  year      = {2021},
  url       = {https://aclanthology.org/2021.acl-long.229},
  keywords  = {Continual Learning}
}
@String(kanwatchara-etal-2021-rational="Rational LAMOL enhances LAMOL, a recent LL model, by applying critical freezing guided by human rationales. When the human rationales are not available, we propose exploiting unsupervised generated rationales as substitutions.")

@inproceedings{LinMF20,
  author    = {Zhaojiang Lin and
               Andrea Madotto and
               Pascale Fung},
  title     = {Exploring Versatile Generative Language Model Via Parameter-Efficient
               Transfer Learning},
  booktitle = {EMNLP Findings},
  pages     = {441--459},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.findings-emnlp.41},
  keywords  = {Continual Learning}
}
@String(LinMF20="Proposing an adapter-based method for continual learning in text generation. One of the insights is a frozen PLM can be well-applied in continual learning.")

@inproceedings{arumae-etal-2020-empirical,
  author    = {Arumae, Kristjan and
               Sun, Qing and
               Bhatia, Parminder},
  title     = {An Empirical Investigation Towards Efficient Multi-Domain Language Model Pre-training},
  booktitle = {Proceedings of EMNLP},
  pages     = {4854--4864},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.394},
  keywords  = {Continual Learning}
}
@String(arumae-etal-2020-empirical="We find that elastic weight consolidation provides best overall scores yielding only a 0.33% drop in performance across seven generic tasks while remaining competitive in bio-medical tasks.")

@inproceedings{garcia-etal-2021-towards,
  author    = {Garcia, Xavier and
               Constant, Noah and
               Parikh, Ankur and
               Firat, Orhan},
  title     = {Towards Continual Learning for Multilingual Machine Translation via Vocabulary Substitution},
  booktitle = {Proceedings of NAACL-HLT},
  pages     = {1184--1192},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.naacl-main.93},
  keywords  = {Continual Learning}
}
@String(garcia-etal-2021-towards="Introducing the catastrophic forgetting problem in incremental multi-language translation, and utilizing a vocabulary substitution manner to alleviate the above problem.")

@inproceedings{huang-etal-2021-continual,
  author    = {Huang, Yufan and
               Zhang, Yanzhe and
               Chen, Jiaao and
               Wang, Xuezhi and
               Yang, Diyi},
  title     = {Continual Learning for Text Classification with Information Disentanglement Based Regularization},
  booktitle = {Proceedings of NAACL-HLT},
  pages     = {2736--2746},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.naacl-main.218},
  keywords  = {Continual Learning}
}
@String(huang-etal-2021-continual="Proposing a regularization-based method for continual text classification, introducing the next sentence prediction and task id prediction as auxiliary tasks.")

@inproceedings{xia-etal-2021-incremental,
  author    = {Xia, Congying and
               Yin, Wenpeng and
               Feng, Yihao and
               Yu, Philip},
  title     = {Incremental Few-shot Text Classification with Multi-round New Classes: Formulation, Dataset and System},
  booktitle = {Proceedings of NAACL-HLT},
  pages     = {1351--1360},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.naacl-main.106},
  keywords  = {Continual Learning}
}
@String(xia-etal-2021-incremental="Proposing a new setting and respective benchmark for few-shot incremental text classification, modeling continual text classification with text entailment.")

@inproceedings{hua-etal-2021-hyperparameter,
  author    = {Hua, Ting and
               Shen, Yilin and
               Zhao, Changsheng and
               Hsu, Yen-Chang and
               Jin, Hongxia},
  title     = {Hyperparameter-free Continuous Learning for Domain Classification in Natural Language Understanding},
  booktitle = {Proceedings of NAACL-HLT},
  pages     = {2669--2678},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.naacl-main.212},
  keywords  = {Continual Learning}
}
@String(hua-etal-2021-hyperparameter="Inspired by EWC and proposing a hyperparameter-free (Fisher information-based) sampling method for memory replay.")

@inproceedings{vijayaraghavan-roy-2021-lifelong,
  author    = {Vijayaraghavan, Prashanth and
               Roy, Deb},
  title     = {Lifelong Knowledge-Enriched Social Event Representation Learning},
  booktitle = {Proceedings of EACL},
  pages     = {3624--3635},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.eacl-main.317},
  keywords  = {Continual Learning}
}
@String(vijayaraghavan-roy-2021-lifelong="Proposing a rehearsal-based method, i.e., Domain-Representative Episodic Memory Replay (DR-EMR), for lifelong event representation with embedding alignment and external social commonsense knowledge.")

@inproceedings{jin-etal-2020-visually,
  author    = {Jin, Xisen and
               Du, Junyi and
               Sadhu, Arka and
               Nevatia, Ram and
               Ren, Xiang},
  title     = {Visually Grounded Continual Learning of Compositional Phrases},
  booktitle = {Proceedings of EMNLP},
  pages     = {2018--2029},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.158},
  doi       = {10.18653/v1/2020.emnlp-main.158},
  keywords  = {Continual Learning}
}
@String(jin-etal-2020-visually="A novel continual learning setting and a new benchmark for continual caption generation, evaluated with existing rehearsal-based methods.")

@inproceedings{cao-etal-2020-incremental,
  author    = {Cao, Pengfei and
               Chen, Yubo and
               Zhao, Jun and
               Wang, Taifeng},
  title     = {Incremental Event Detection via Knowledge Consolidation Networks},
  booktitle = {Proceedings of EMNLP},
  pages     = {707--717},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.52},
  doi       = {10.18653/v1/2020.emnlp-main.52},
  keywords  = {Continual Learning}
}
@String(cao-etal-2020-incremental="Proposing a hybrid continual learning method for event detection, combining experience replay and Knowledge Distillation, focusing on (1) semantic ambiguity in NLP and (2) data imbalance between memory and current task.")

@inproceedings{dai-etal-2020-multi,
  author    = {Dai, Zehui and
               Peng, Cheng and
               Chen, Huajie and
               Ding, Yadong},
  title     = {A Multi-Task Incremental Learning Framework with Category Name Embedding for Aspect-Category Sentiment Analysis},
  booktitle = {Proceedings of EMNLP},
  pages     = {6955--6965},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.565},
  doi       = {10.18653/v1/2020.emnlp-main.565},
  keywords  = {Continual Learning}
}
@String(dai-etal-2020-multi="Utilizing BERT for sentence and category encoding, preserving category encoding to prevent catastrophic forgetting.")

@inproceedings{wang-etal-2020-efficient,
  author    = {Wang, Zirui and
               Mehta, Sanket Vaibhav and
               Poczos, Barnabas and
               Carbonell, Jaime},
  title     = {Efficient Meta Lifelong-Learning with Limited Memory},
  booktitle = {Proceedings of EMNLP},
  pages     = {535--548},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.39},
  doi       = {10.18653/v1/2020.emnlp-main.39},
  keywords  = {Continual Learning}
}
@String(wang-etal-2020-efficient="A meta learning-enhanced version of MbPA (NeurIPS19), sharing the continual setting as well. Figure 1 is interesting.")

@inproceedings{chuang-etal-2020-lifelong,
  author    = {Chuang, Yung-Sung and
               Su, Shang-Yu and
               Chen, Yun-Nung},
  title     = {Lifelong Language Knowledge Distillation},
  booktitle = {Proceedings of EMNLP},
  pages     = {2914--2924},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.233},
  doi       = {10.18653/v1/2020.emnlp-main.233},
  keywords  = {Continual Learning}
}
@String(chuang-etal-2020-lifelong="Proposing a Knowledge Distillation-enhanced Method LLL based on LAMOL (ICLR 2020) model for continual learning, evaluated on text generation and text classification.")

@inproceedings{sun-etal-2020-distill,
  author    = {Sun, Jingyuan and
               Wang, Shaonan and
               Zhang, Jiajun and
               Zong, Chengqing},
  title     = {Distill and Replay for Continual Language Learning},
  booktitle = {Proceedings of COLING},
  pages     = {3569--3579},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.coling-main.318},
  doi       = {10.18653/v1/2020.coling-main.318},
  keywords  = {Continual Learning}
}
@String(sun-etal-2020-distill="Proposing a distill and replay method (DnR) which follows the setting of LAMOL. As a distillation-based method, DnR also shows the ability in incrementally compressing the model size while still outperforming most of the baselines.")

@inproceedings{dAutumeRKY19,
  author    = {Cyprien de Masson d'Autume and
               Sebastian Ruder and
               Lingpeng Kong and
               Dani Yogatama},
  title     = {Episodic Memory in Lifelong Language Learning},
  booktitle = {Proceedings of NeurIPS},
  pages     = {13122--13131},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/f8d2e80c1458ea2501f98a2cafadb397-Abstract.html},
  keywords  = {Continual Learning}
}
@String(dAutumeRKY19="MbPA++. This paper proposes the use of memory (a fixed memory network) in life-long learning to prevent catastrophic forgetting by means of  experience replay and local adaptation. ")

@inproceedings{Sun_Wang_Li_Feng_Tian_Wu_Wang_2020,
  author    = {Sun, Yu and
               Wang, Shuohuan and
               Li, Yukun and
               Feng, Shikun and
               Tian, Hao and
               Wu, Hua and
               Wang, Haifeng},
  title     = {{ERNIE} 2.0: A Continual Pre-Training Framework for Language Understanding},
  booktitle = {Proceedings of AAAI},
  pages     = {8968--8975},
  year      = {2020},
  url       = {https://ojs.aaai.org/index.php/AAAI/article/view/6428},
  doi       = {10.1609/aaai.v34i05.6428},
  keywords  = {Continual Learning}
}
@String(Sun_Wang_Li_Feng_Tian_Wu_Wang_2020="In order to extract the lexical, syntactic and semantic information from training corpora, we propose a continual pre-training framework named ERNIE 2.0 which incrementally builds pre-training tasks and then learn pre-trained models on these constructed tasks via continual multi-task learning.")

@article{abs-2105-13880,
  author    = {Yujia Qin and
               Yankai Lin and
               Jing Yi and
               Jiajie Zhang and
               Xu Han and
               Zhengyan Zhang and
               YuSheng Su and
               Zhiyuan Liu and
               Peng Li and
               Maosong Sun and
               Jie Zhou},
  title     = {Knowledge Inheritance for Pre-trained Language Models},
  journal   = {CoRR},
  volume    = {abs/2105.13880},
  year      = {2021},
  url       = {https://arxiv.org/abs/2105.13880},
  keywords  = {Continual Learning}
}
@String(abs-2105-13880="We explore the question of how previously trained PLMs can benefit the training of larger PLMs in the future. Specifically, we introduce a novel pre-training framework named “knowledge inheritance” (KI), which combines both self-learning and teacher-guided learning to efficiently train larger PLMs.")

@article{liu2021lifelong,
  author    = {Qingbin Liu and
               Xiaoyan Yu and
               Shizhu He and
               Kang Liu and
               Jun Zhao},
  title     = {Lifelong Intent Detection via Multi-Strategy Rebalancing},
  journal   = {CoRR},
  volume    = {abs/2108.04445},
  year      = {2021},
  url       = {https://arxiv.org/abs/2108.04445},
  keywords  = {Continual Learning}
}
@String(liu2021lifelong="We propose the lifelong intent detection task to handle continually emerging user intents. And, we propose multistrategy rebalancing to address multiple adverse effects caused by the data imbalance problem.")


@inproceedings{DBLP:conf/emnlp/ArtetxeBGMOSLDI22,
  author    = {Mikel Artetxe and
               Shruti Bhosale and
               Naman Goyal and
               Todor Mihaylov and
               Myle Ott and
               Sam Shleifer and
               Xi Victoria Lin and
               Jingfei Du and
               Srinivasan Iyer and
               Ramakanth Pasunuru and
               Giridharan Anantharaman and
               Xian Li and
               Shuohui Chen and
               Halil Akin and
               Mandeep Baines and
               Louis Martin and
               Xing Zhou and
               Punit Singh Koura and
               Brian O'Horo and
               Jeffrey Wang and
               Luke Zettlemoyer and
               Mona T. Diab and
               Zornitsa Kozareva and
               Veselin Stoyanov},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {Efficient Large Scale Language Modeling with Mixtures of Experts},
  booktitle = {EMNLP},
  pages     = {11699--11732},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.804},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ArtetxeBGMOSLDI22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Mixtures of Experts},
  plm       = {MoE},
  code      = {https://github.com/facebookresearch/fairseq/tree/main/examples/moe_lm}
}

@article{DBLP:journals/corr/abs-2204-05862,
  author    = {Yuntao Bai and
               Andy Jones and
               Kamal Ndousse and
               Amanda Askell and
               Anna Chen and
               Nova DasSarma and
               Dawn Drain and
               Stanislav Fort and
               Deep Ganguli and
               Tom Henighan and
               Nicholas Joseph and
               Saurav Kadavath and
               Jackson Kernion and
               Tom Conerly and
               Sheer El Showk and
               Nelson Elhage and
               Zac Hatfield{-}Dodds and
               Danny Hernandez and
               Tristan Hume and
               Scott Johnston and
               Shauna Kravec and
               Liane Lovitt and
               Neel Nanda and
               Catherine Olsson and
               Dario Amodei and
               Tom B. Brown and
               Jack Clark and
               Sam McCandlish and
               Chris Olah and
               Benjamin Mann and
               Jared Kaplan},
  title     = {Training a Helpful and Harmless Assistant with Reinforcement Learning
               from Human Feedback},
  journal   = {CoRR},
  volume    = {abs/2204.05862},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2204.05862},
  doi       = {10.48550/arXiv.2204.05862},
  eprinttype = {arXiv},
  eprint    = {2204.05862},
  timestamp = {Tue, 19 Apr 2022 17:11:58 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2204-05862.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {RLHF}
}

@article{DBLP:journals/corr/abs-2210-02441,
  author    = {Simran Arora and
               Avanika Narayan and
               Mayee F. Chen and
               Laurel J. Orr and
               Neel Guha and
               Kush Bhatia and
               Ines Chami and
               Frederic Sala and
               Christopher R{\'{e}}},
  title     = {Ask Me Anything: {A} simple strategy for prompting language models},
  journal   = {CoRR},
  volume    = {abs/2210.02441},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.02441},
  doi       = {10.48550/arXiv.2210.02441},
  eprinttype = {arXiv},
  eprint    = {2210.02441},
  timestamp = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-02441.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering}
}

@article{DBLP:journals/corr/abs-2302-11382,
  author    = {Jules White and
               Quchen Fu and
               Sam Hays and
               Michael Sandborn and
               Carlos Olea and
               Henry Gilbert and
               Ashraf Elnashar and
               Jesse Spencer{-}Smith and
               Douglas C. Schmidt},
  title     = {A Prompt Pattern Catalog to Enhance Prompt Engineering with {ChatGPT}},
  journal   = {CoRR},
  volume    = {abs/2302.11382},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.11382},
  doi       = {10.48550/arXiv.2302.11382},
  eprinttype = {arXiv},
  eprint    = {2302.11382},
  timestamp = {Fri, 24 Feb 2023 11:55:23 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-11382.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Prompt Engineering}
}

@article{DBLP:journals/corr/abs-2302-09051,
  author    = {Xavier Daull and
               Patrice Bellot and
               Emmanuel Bruno and
               Vincent Martin and
               Elisabeth Murisasco},
  title     = {Complex {QA} and language models hybrid architectures, Survey},
  journal   = {CoRR},
  volume    = {abs/2302.09051},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.09051},
  doi       = {10.48550/arXiv.2302.09051},
  eprinttype = {arXiv},
  eprint    = {2302.09051},
  timestamp = {Thu, 23 Feb 2023 16:02:44 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-09051.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Survey}
}

@article{DBLP:journals/corr/abs-2301-13867,
  author    = {Simon Frieder and
               Luca Pinchetti and
               Ryan{-}Rhys Griffiths and
               Tommaso Salvatori and
               Thomas Lukasiewicz and
               Philipp Christian Petersen and
               Alexis Chevalier and
               Julius Berner},
  title     = {Mathematical Capabilities of {ChatGPT}},
  journal   = {CoRR},
  volume    = {abs/2301.13867},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2301.13867},
  doi       = {10.48550/arXiv.2301.13867},
  eprinttype = {arXiv},
  eprint    = {2301.13867},
  timestamp = {Thu, 02 Feb 2023 12:02:45 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-13867.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation}
}

@article{lee2023aligning,
  author    = {Lee, Kimin and
               Liu, Hao and
               Ryu, Moonkyung and
               Watkins, Olivia and
               Du, Yuqing and
               Boutilier, Craig and
               Abbeel, Pieter and
               Ghavamzadeh, Mohammad and
               Gu, Shixiang Shane},
  title     = {Aligning Text-to-Image Models using Human Feedback},
  journal   = {CoRR},
  volume    = {abs/2302.12192},
  year      = {2023},
  url       = {https://arxiv.org/abs/2302.12192},
  eprinttype = {arXiv},
  eprint    = {2302.12192},
  keywords  = {RLHF, Multimodal}
}

@article{DBLP:journals/corr/abs-2205-11916,
  author    = {Takeshi Kojima and
               Shixiang Shane Gu and
               Machel Reid and
               Yutaka Matsuo and
               Yusuke Iwasawa},
  title     = {Large Language Models are Zero-Shot Reasoners},
  journal   = {CoRR},
  volume    = {abs/2205.11916},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2205.11916},
  doi       = {10.48550/arXiv.2205.11916},
  eprinttype = {arXiv},
  eprint    = {2205.11916},
  timestamp = {Tue, 16 Aug 2022 23:07:05 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2205-11916.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2205-09712,
  author    = {Antonia Creswell and
               Murray Shanahan and
               Irina Higgins},
  title     = {Selection-Inference: Exploiting Large Language Models for Interpretable
               Logical Reasoning},
  journal   = {CoRR},
  volume    = {abs/2205.09712},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2205.09712},
  doi       = {10.48550/arXiv.2205.09712},
  eprinttype = {arXiv},
  eprint    = {2205.09712},
  timestamp = {Mon, 23 May 2022 14:22:18 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2205-09712.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}


@article{DBLP:journals/corr/abs-2206-07682,
  author    = {Jason Wei and
               Yi Tay and
               Rishi Bommasani and
               Colin Raffel and
               Barret Zoph and
               Sebastian Borgeaud and
               Dani Yogatama and
               Maarten Bosma and
               Denny Zhou and
               Donald Metzler and
               Ed H. Chi and
               Tatsunori Hashimoto and
               Oriol Vinyals and
               Percy Liang and
               Jeff Dean and
               William Fedus},
  title     = {Emergent Abilities of Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2206.07682},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2206.07682},
  doi       = {10.48550/arXiv.2206.07682},
  eprinttype = {arXiv},
  eprint    = {2206.07682},
  timestamp = {Tue, 21 Jun 2022 17:35:15 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2206-07682.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@inproceedings{DBLP:conf/kdd/ZhaoZGZZS0WLW22,
  author    = {Wayne Xin Zhao and
               Kun Zhou and
               Zheng Gong and
               Beichen Zhang and
               Yuanhang Zhou and
               Jing Sha and
               Zhigang Chen and
               Shijin Wang and
               Cong Liu and
               Ji{-}Rong Wen},
  editor    = {Aidong Zhang and
               Huzefa Rangwala},
  title     = {{JiuZhang}: {A} {Chinese} Pre-trained Language Model for Mathematical
               Problem Understanding},
  booktitle = {KDD},
  pages     = {4571--4581},
  publisher = {{ACM}},
  year      = {2022},
  url       = {https://doi.org/10.1145/3534678.3539131},
  doi       = {10.1145/3534678.3539131},
  timestamp = {Tue, 16 Aug 2022 14:34:55 +0200},
  biburl    = {https://dblp.org/rec/conf/kdd/ZhaoZGZZS0WLW22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought, Arithmetic Reasoning}
}

@article{DBLP:journals/corr/abs-2302-12246,
  author    = {Shizhe Diao and
               Pengcheng Wang and
               Yong Lin and
               Tong Zhang},
  title     = {Active Prompting with Chain-of-Thought for Large Language Models},
  journal   = {CoRR},
  volume    = {abs/2302.12246},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.12246},
  doi       = {10.48550/arXiv.2302.12246},
  eprinttype = {arXiv},
  eprint    = {2302.12246},
  timestamp = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-12246.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2212-10071,
  author    = {Namgyu Ho and
               Laura Schmid and
               Se{-}Young Yun},
  title     = {Large Language Models Are Reasoning Teachers},
  journal   = {CoRR},
  volume    = {abs/2212.10071},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.10071},
  doi       = {10.48550/arXiv.2212.10071},
  eprinttype = {arXiv},
  eprint    = {2212.10071},
  timestamp = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-10071.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2212-09561,
  author    = {Yixuan Weng and
               Minjun Zhu and
               Shizhu He and
               Kang Liu and
               Jun Zhao},
  title     = {Large Language Models are reasoners with Self-Verification},
  journal   = {CoRR},
  volume    = {abs/2212.09561},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.09561},
  doi       = {10.48550/arXiv.2212.09561},
  eprinttype = {arXiv},
  eprint    = {2212.09561},
  timestamp = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-09561.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2212-09597,
  author    = {Shuofei Qiao and
               Yixin Ou and
               Ningyu Zhang and
               Xiang Chen and
               Yunzhi Yao and
               Shumin Deng and
               Chuanqi Tan and
               Fei Huang and
               Huajun Chen},
  title     = {Reasoning with Language Model Prompting: {A} Survey},
  journal   = {CoRR},
  volume    = {abs/2212.09597},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.09597},
  doi       = {10.48550/arXiv.2212.09597},
  eprinttype = {arXiv},
  eprint    = {2212.09597},
  timestamp = {Thu, 26 Jan 2023 17:27:32 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-09597.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought, Survey}
}

@article{DBLP:journals/corr/abs-2211-10435,
  author    = {Luyu Gao and
               Aman Madaan and
               Shuyan Zhou and
               Uri Alon and
               Pengfei Liu and
               Yiming Yang and
               Jamie Callan and
               Graham Neubig},
  title     = {{PAL:} Program-aided Language Models},
  journal   = {CoRR},
  volume    = {abs/2211.10435},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2211.10435},
  doi       = {10.48550/arXiv.2211.10435},
  eprinttype = {arXiv},
  eprint    = {2211.10435},
  timestamp = {Thu, 24 Nov 2022 15:52:33 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2211-10435.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2210-06710,
  author    = {Wenhu Chen},
  title     = {Large Language Models are few(1)-shot Table Reasoners},
  journal   = {CoRR},
  volume    = {abs/2210.06710},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.06710},
  doi       = {10.48550/arXiv.2210.06710},
  eprinttype = {arXiv},
  eprint    = {2210.06710},
  timestamp = {Tue, 18 Oct 2022 15:06:52 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-06710.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2210-11610,
  author    = {Jiaxin Huang and
               Shixiang Shane Gu and
               Le Hou and
               Yuexin Wu and
               Xuezhi Wang and
               Hongkun Yu and
               Jiawei Han},
  title     = {Large Language Models Can Self-Improve},
  journal   = {CoRR},
  volume    = {abs/2210.11610},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.11610},
  doi       = {10.48550/arXiv.2210.11610},
  eprinttype = {arXiv},
  eprint    = {2210.11610},
  timestamp = {Tue, 25 Oct 2022 14:25:08 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-11610.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@inproceedings{DBLP:conf/naacl/ZuoZLHZC22,
  author    = {Simiao Zuo and
               Qingru Zhang and
               Chen Liang and
               Pengcheng He and
               Tuo Zhao and
               Weizhu Chen},
  editor    = {Marine Carpuat and
               Marie{-}Catherine de Marneffe and
               Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title     = {{MoEBERT}: from {BERT} to Mixture-of-Experts via Importance-Guided Adaptation},
  booktitle = {NAACL},
  pages     = {1610--1623},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.116},
  doi       = {10.18653/v1/2022.naacl-main.116},
  timestamp = {Mon, 01 Aug 2022 16:27:57 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/ZuoZLHZC22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Mixtures of Experts}
}

@article{DBLP:journals/corr/abs-2212-05055,
  author    = {Aran Komatsuzaki and
               Joan Puigcerver and
               James Lee{-}Thorp and
               Carlos Riquelme Ruiz and
               Basil Mustafa and
               Joshua Ainslie and
               Yi Tay and
               Mostafa Dehghani and
               Neil Houlsby},
  title     = {Sparse Upcycling: Training Mixture-of-Experts from Dense Checkpoints},
  journal   = {CoRR},
  volume    = {abs/2212.05055},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2212.05055},
  doi       = {10.48550/arXiv.2212.05055},
  eprinttype = {arXiv},
  eprint    = {2212.05055},
  timestamp = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2212-05055.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Mixtures of Experts}
}

@article{DBLP:journals/corr/abs-2210-01351,
  author    = {Chen Liang and
               Simiao Zuo and
               Qingru Zhang and
               Pengcheng He and
               Weizhu Chen and
               Tuo Zhao},
  title     = {Less is More: Task-aware Layer-wise Distillation for Language Model Compression},
  journal   = {CoRR},
  volume    = {abs/2210.01351},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.01351},
  doi       = {10.48550/arXiv.2210.01351},
  eprinttype = {arXiv},
  eprint    = {2210.01351},
  timestamp = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-01351.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Knowledge Distillation}
}

@article{DBLP:journals/corr/abs-2210-03885,
  author    = {Tao Zhong and
               Zhixiang Chi and
               Li Gu and
               Yang Wang and
               Yuanhao Yu and
               Jin Tang},
  title     = {{Meta-DMoE}: Adapting to Domain Shift by Meta-Distillation from Mixture-of-Experts},
  journal   = {CoRR},
  volume    = {abs/2210.03885},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.03885},
  doi       = {10.48550/arXiv.2210.03885},
  eprinttype = {arXiv},
  eprint    = {2210.03885},
  timestamp = {Fri, 30 Dec 2022 23:08:59 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-03885.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Mixtures of Experts, Knowledge Distillation}
}

@article{DBLP:journals/corr/abs-2006-03654,
  author    = {Pengcheng He and
               Xiaodong Liu and
               Jianfeng Gao and
               Weizhu Chen},
  title     = {{DeBERTa}: Decoding-enhanced {BERT} with Disentangled Attention},
  journal   = {CoRR},
  volume    = {abs/2006.03654},
  year      = {2020},
  url       = {https://arxiv.org/abs/2006.03654},
  eprinttype = {arXiv},
  eprint    = {2006.03654},
  timestamp = {Mon, 30 May 2022 13:48:56 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2006-03654.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  plm       = {DeBERTa},
  keywords  = {Pre-Training Techniques}
}


@inproceedings{DBLP:conf:icml:IrieCS22,
  author    = {Kazuki Irie and
               R{\'{o}}bert Csord{\'{a}}s and
               J{\"{u}}rgen Schmidhuber},
  editor    = {Kamalika Chaudhuri and
               Stefanie Jegelka and
               Le Song and
               Csaba Szepesv{\'{a}}ri and
               Gang Niu and
               Sivan Sabato},
  title     = {The Dual Form of Neural Networks Revisited: Connecting Test Time Predictions to Training Patterns via Spotlights of Attention},
  booktitle = {ICML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {162},
  pages     = {9639--9659},
  publisher = {{PMLR}},
  year      = {2022},
  url       = {https://proceedings.mlr.press/v162/irie22a.html},
  timestamp = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/IrieCS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {In-Context Learning}
}
@String(DBLP:conf:icml:IrieCS22="(1) 很有意思的一篇，回顾神经网络（NN）线性层Y=WX（省略偏置b）的原始形式与对偶形式，两种形式完全等价；
(2) 从对偶形式中可以发现，通过反向传播训练的NN线性层的输出主要是该层在训练期间的训练误差信号et的线性组合，其中权重是通过比较测试查询x和每个训练输入计算出来的；进一步可以得出，如果测试时输入的x和训练时的输入是正交的，那么梯度下降所得到的参数更新对于该样本x完全没有影响。")

@article{DBLP:journals/corr/abs-2302-08081,
  author    = {Xianjun Yang and
               Yan Li and
               Xinlu Zhang and
               Haifeng Chen and
               Wei Cheng},
  title     = {Exploring the Limits of {ChatGPT} for Query or Aspect-based Text Summarization},
  journal   = {CoRR},
  volume    = {abs/2302.08081},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.08081},
  doi       = {10.48550/arXiv.2302.08081},
  eprinttype = {arXiv},
  eprint    = {2302.08081},
  timestamp = {Mon, 20 Feb 2023 14:27:28 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-08081.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation}
}


@article{DBLP:journals/corr/abs-2302-12095,
  author    = {Jindong Wang and
               Xixu Hu and
               Wenxin Hou and
               Hao Chen and
               Runkai Zheng and
               Yidong Wang and
               Linyi Yang and
               Haojun Huang and
               Wei Ye and
               Xiubo Geng and
               Binxing Jiao and
               Yue Zhang and
               Xing Xie},
  title     = {On the Robustness of {ChatGPT}: An Adversarial and Out-of-distribution
               Perspective},
  journal   = {CoRR},
  volume    = {abs/2302.12095},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.12095},
  doi       = {10.48550/arXiv.2302.12095},
  eprinttype = {arXiv},
  eprint    = {2302.12095},
  timestamp = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-12095.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation, Reliability}
}

@article{DBLP:journals/corr/abs-2302-13007,
  author    = {Haixing Dai and
               Zhengliang Liu and
               Wenxiong Liao and
               Xiaoke Huang and
               Zihao Wu and
               Lin Zhao and
               Wei Liu and
               Ninghao Liu and
               Sheng Li and
               Dajiang Zhu and
               Hongmin Cai and
               Quanzheng Li and
               Dinggang Shen and
               Tianming Liu and
               Xiang Li},
  title     = {{ChatAug}: Leveraging {ChatGPT} for Text Data Augmentation},
  journal   = {CoRR},
  volume    = {abs/2302.13007},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.13007},
  doi       = {10.48550/arXiv.2302.13007},
  eprinttype = {arXiv},
  eprint    = {2302.13007},
  timestamp = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-13007.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Data Augmentation}
}

@inproceedings{DBLP:conf/emnlp/YooPKLP21,
  author    = {Kang Min Yoo and
               Dongju Park and
               Jaewook Kang and
               Sang{-}Woo Lee and
               Woo{-}Myoung Park},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {{GPT3Mix}: Leveraging Large-scale Language Models for Text Augmentation},
  booktitle = {EMNLP Findings},
  pages     = {2225--2239},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-emnlp.192},
  doi       = {10.18653/v1/2021.findings-emnlp.192},
  timestamp = {Tue, 31 May 2022 12:52:24 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/YooPKLP21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Data Augmentation}
}

@inproceedings{DBLP:conf/emnlp/ReimersG19,
  author    = {Nils Reimers and
               Iryna Gurevych},
  editor    = {Kentaro Inui and
               Jing Jiang and
               Vincent Ng and
               Xiaojun Wan},
  title     = {{Sentence-BERT}: Sentence Embeddings using {Siamese} {BERT-Networks}},
  booktitle = {EMNLP},
  pages     = {3980--3990},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/D19-1410},
  doi       = {10.18653/v1/D19-1410},
  timestamp = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/ReimersG19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  plm       = {SBERT},
  keywords  = {Pre-Training Techniques}
}

@article{DBLP:journals/corr/abs-2107-03374,
  author    = {Mark Chen and
               Jerry Tworek and
               Heewoo Jun and
               Qiming Yuan and
               Henrique Pond{\'{e}} de Oliveira Pinto and
               Jared Kaplan and
               Harrison Edwards and
               Yuri Burda and
               Nicholas Joseph and
               Greg Brockman and
               Alex Ray and
               Raul Puri and
               Gretchen Krueger and
               Michael Petrov and
               Heidy Khlaaf and
               Girish Sastry and
               Pamela Mishkin and
               Brooke Chan and
               Scott Gray and
               Nick Ryder and
               Mikhail Pavlov and
               Alethea Power and
               Lukasz Kaiser and
               Mohammad Bavarian and
               Clemens Winter and
               Philippe Tillet and
               Felipe Petroski Such and
               Dave Cummings and
               Matthias Plappert and
               Fotios Chantzis and
               Elizabeth Barnes and
               Ariel Herbert{-}Voss and
               William Hebgen Guss and
               Alex Nichol and
               Alex Paino and
               Nikolas Tezak and
               Jie Tang and
               Igor Babuschkin and
               Suchir Balaji and
               Shantanu Jain and
               William Saunders and
               Christopher Hesse and
               Andrew N. Carr and
               Jan Leike and
               Joshua Achiam and
               Vedant Misra and
               Evan Morikawa and
               Alec Radford and
               Matthew Knight and
               Miles Brundage and
               Mira Murati and
               Katie Mayer and
               Peter Welinder and
               Bob McGrew and
               Dario Amodei and
               Sam McCandlish and
               Ilya Sutskever and
               Wojciech Zaremba},
  title     = {Evaluating Large Language Models Trained on Code},
  journal   = {CoRR},
  volume    = {abs/2107.03374},
  year      = {2021},
  url       = {https://arxiv.org/abs/2107.03374},
  eprinttype = {arXiv},
  eprint    = {2107.03374},
  timestamp = {Thu, 09 Feb 2023 14:04:35 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2107-03374.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  plm       = {Codex},
  keywords  = {Pre-Training Techniques}
}

@article{DBLP:journals/jmlr/RaffelSRLNMZLL20,
  author    = {Colin Raffel and
               Noam Shazeer and
               Adam Roberts and
               Katherine Lee and
               Sharan Narang and
               Michael Matena and
               Yanqi Zhou and
               Wei Li and
               Peter J. Liu},
  title     = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},
  journal   = {JMLR},
  volume    = {21},
  pages     = {140:1--140:67},
  year      = {2020},
  url       = {http://jmlr.org/papers/v21/20-074.html},
  timestamp = {Fri, 05 Feb 2021 15:43:41 +0100},
  biburl    = {https://dblp.org/rec/journals/jmlr/RaffelSRLNMZLL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Pre-Training Techniques},
  plm       = {T5}
}

@article{DBLP:journals/corr/abs-2205-01068,
  author    = {Susan Zhang and
               Stephen Roller and
               Naman Goyal and
               Mikel Artetxe and
               Moya Chen and
               Shuohui Chen and
               Christopher Dewan and
               Mona T. Diab and
               Xian Li and
               Xi Victoria Lin and
               Todor Mihaylov and
               Myle Ott and
               Sam Shleifer and
               Kurt Shuster and
               Daniel Simig and
               Punit Singh Koura and
               Anjali Sridhar and
               Tianlu Wang and
               Luke Zettlemoyer},
  title     = {{OPT:} Open Pre-trained Transformer Language Models},
  journal   = {CoRR},
  volume    = {abs/2205.01068},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2205.01068},
  doi       = {10.48550/arXiv.2205.01068},
  eprinttype = {arXiv},
  eprint    = {2205.01068},
  timestamp = {Thu, 22 Sep 2022 19:27:06 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2205-01068.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Pre-Training Techniques},
  plm       = {OPT}
}

@article{DBLP:journals/corr/abs-2302-12822,
  author    = {Kashun Shum and
               Shizhe Diao and
               Tong Zhang},
  title     = {Automatic Prompt Augmentation and Selection with Chain-of-Thought from Labeled Data},
  journal   = {CoRR},
  volume    = {abs/2302.12822},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.12822},
  doi       = {10.48550/arXiv.2302.12822},
  eprinttype = {arXiv},
  eprint    = {2302.12822},
  timestamp = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-12822.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2301-04655,
  author    = {Roberto Gozalo{-}Brizuela and
               Eduardo C. Garrido{-}Merch{\'{a}}n},
  title     = {{ChatGPT} is not all you need. {A} State of the Art Review of large
               Generative {AI} models},
  journal   = {CoRR},
  volume    = {abs/2301.04655},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2301.04655},
  doi       = {10.48550/arXiv.2301.04655},
  eprinttype = {arXiv},
  eprint    = {2301.04655},
  timestamp = {Thu, 19 Jan 2023 15:40:01 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-04655.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation}
}

@article{DBLP:journals/corr/abs-2302-10198,
  author    = {Qihuang Zhong and
               Liang Ding and
               Juhua Liu and
               Bo Du and
               Dacheng Tao},
  title     = {Can {ChatGPT} Understand Too? {A} Comparative Study on {ChatGPT} and Fine-tuned
               {BERT}},
  journal   = {CoRR},
  volume    = {abs/2302.10198},
  year      = {2023},
  url       = {https://arxiv.org/abs/2302.10198},
  doi       = {10.48550/arXiv.2302.10198},
  eprinttype = {arXiv},
  eprint    = {2302.10198},
  timestamp = {Mon, 06 Mar 2023 16:35:10 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-10198.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Evaluation}
}


@article{driess2023palm,
  title     = {{PaLM-E}: An Embodied Multimodal Language Model},
  author    = {Driess, Danny and Xia, Fei and Sajjadi, Mehdi S. M. and Lynch, Corey and Chowdhery, Aakanksha and Ichter, Brian and Wahid, Ayzaan and Tompson, Jonathan and Vuong, Quan and Yu, Tianhe and others},
  journal   = {CoRR},
  volume    = {abs/2303.03378},
  year      = {2023},
  url       = {https://arxiv.org/abs/2303.03378},
  eprinttype = {arXiv},
  eprint    = {2303.03378},
  keywords  = {Multimodal},
  plm       = {PaLM-E}
}

@inproceedings{DBLP:conf/acl/WangICR21,
  author    = {Peifeng Wang and
               Filip Ilievski and
               Muhao Chen and
               Xiang Ren},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {Do Language Models Perform Generalizable Commonsense Inference?},
  booktitle = {ACL Findings},
  series    = {Findings of {ACL}},
  volume    = {{ACL/IJCNLP} 2021},
  pages     = {3681--3688},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-acl.322},
  doi       = {10.18653/v1/2021.findings-acl.322},
  timestamp = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/WangICR21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  code      = {https://github.com/wangpf3/LM-for-CommonsenseInference},
  keywords  = {Generalizability, Evaluation}
}

@article{DBLP:journals/corr/abs-2302-03154,
  author    = {J. D. Zamfirescu{-}Pereira and
               Bjoern Hartmann and
               Qian Yang},
  title     = {Conversation Regression Testing: {A} Design Technique for Prototyping Generalizable Prompt Strategies for Pre-trained Language Models},
  journal   = {CoRR},
  volume    = {abs/2302.03154},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.03154},
  doi       = {10.48550/arXiv.2302.03154},
  eprinttype = {arXiv},
  eprint    = {2302.03154},
  timestamp = {Fri, 10 Feb 2023 12:26:38 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-03154.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Generalizability}
}


@article{DBLP:journals/corr/abs-2206-05658,
  author    = {Hang Hua and
               Xingjian Li and
               Dejing Dou and
               Cheng{-}Zhong Xu and
               Jiebo Luo},
  title     = {Fine-tuning Pre-trained Language Models with Noise Stability Regularization},
  journal   = {CoRR},
  volume    = {abs/2206.05658},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2206.05658},
  doi       = {10.48550/arXiv.2206.05658},
  eprinttype = {arXiv},
  eprint    = {2206.05658},
  timestamp = {Wed, 07 Dec 2022 23:00:48 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2206-05658.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Generalizability}
}

@article{DBLP:journals/corr/abs-2210-01293,
  author    = {Batu Ozturkler and
               Nikolay Malkin and
               Zhen Wang and
               Nebojsa Jojic},
  title     = {{ThinkSum}: Probabilistic reasoning over sets using large language models},
  journal   = {CoRR},
  volume    = {abs/2210.01293},
  year      = {2022},
  url       = {https://doi.org/10.48550/arXiv.2210.01293},
  doi       = {10.48550/arXiv.2210.01293},
  eprinttype = {arXiv},
  eprint    = {2210.01293},
  timestamp = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2210-01293.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Reasoning}
}

@inproceedings{DBLP:conf/acl/CaoLHSYLXX20,
  author    = {Boxi Cao and
               Hongyu Lin and
               Xianpei Han and
               Le Sun and
               Lingyong Yan and
               Meng Liao and
               Tong Xue and
               Jin Xu},
  editor    = {Chengqing Zong and
               Fei Xia and
               Wenjie Li and
               Roberto Navigli},
  title     = {Knowledgeable or Educated Guess? Revisiting Language Models as Knowledge
               Bases},
  booktitle = {ACL},
  pages     = {1860--1874},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.146},
  doi       = {10.18653/v1/2021.acl-long.146},
  timestamp = {Sun, 02 Oct 2022 15:53:42 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/CaoLHSYLXX20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Language Model as Knowledge Base}
}

@inproceedings{DBLP:conf/emnlp/PetroniRRLBWM19,
  author    = {Fabio Petroni and
               Tim Rockt{\"{a}}schel and
               Sebastian Riedel and
               Patrick S. H. Lewis and
               Anton Bakhtin and
               Yuxiang Wu and
               Alexander H. Miller},
  editor    = {Kentaro Inui and
               Jing Jiang and
               Vincent Ng and
               Xiaojun Wan},
  title     = {Language Models as Knowledge Bases?},
  booktitle = {EMNLP},
  pages     = {2463--2473},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/D19-1250},
  doi       = {10.18653/v1/D19-1250},
  timestamp = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/PetroniRRLBWM19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Language Model as Knowledge Base}
}

@article{DBLP:journals/corr/abs-2303-01081,
  author    = {Mingxu Tao and
               Yansong Feng and
               Dongyan Zhao},
  title     = {Can {BERT} Refrain from Forgetting on Sequential Tasks? {A} Probing Study},
  journal   = {CoRR},
  volume    = {abs/2303.01081},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2303.01081},
  doi       = {10.48550/arXiv.2303.01081},
  eprinttype = {arXiv},
  eprint    = {2303.01081},
  timestamp = {Mon, 06 Mar 2023 16:51:26 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2303-01081.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning}
}

@inproceedings{DBLP:conf/emnlp/JangYLYSHKS22,
  author    = {Joel Jang and
               Seonghyeon Ye and
               Changho Lee and
               Sohee Yang and
               Joongbo Shin and
               Janghoon Han and
               Gyeonghun Kim and
               Minjoon Seo},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {{TemporalWiki}: {A} Lifelong Benchmark for Training and Evaluating Ever-Evolving
               Language Models},
  booktitle = {EMNLP},
  pages     = {6237--6250},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.418},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/JangYLYSHKS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning}
}

@inproceedings{DBLP:conf/icml/LiskaKGTSAdSZYG22,
  author    = {Adam Liska and
               Tom{\'{a}}s Kocisk{\'{y}} and
               Elena Gribovskaya and
               Tayfun Terzi and
               Eren Sezener and
               Devang Agrawal and
               Cyprien de Masson d'Autume and
               Tim Scholtes and
               Manzil Zaheer and
               Susannah Young and
               Ellen Gilsenan{-}McMahon and
               Sophia Austin and
               Phil Blunsom and
               Angeliki Lazaridou},
  editor    = {Kamalika Chaudhuri and
               Stefanie Jegelka and
               Le Song and
               Csaba Szepesv{\'{a}}ri and
               Gang Niu and
               Sivan Sabato},
  title     = {{StreamingQA}: {A} Benchmark for Adaptation to New Knowledge over Time
               in Question Answering Models},
  booktitle = {ICML},
  series    = {Proceedings of Machine Learning Research},
  volume    = {162},
  pages     = {13604--13622},
  publisher = {{PMLR}},
  year      = {2022},
  url       = {https://proceedings.mlr.press/v162/liska22a.html},
  timestamp = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/LiskaKGTSAdSZYG22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Continual Learning}
}

@article{DBLP:journals/corr/abs-2302-00083,
  author    = {Ori Ram and
               Yoav Levine and
               Itay Dalmedigos and
               Dor Muhlgay and
               Amnon Shashua and
               Kevin Leyton{-}Brown and
               Yoav Shoham},
  title     = {In-Context Retrieval-Augmented Language Models},
  journal   = {CoRR},
  volume    = {abs/2302.00083},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.00083},
  doi       = {10.48550/arXiv.2302.00083},
  eprinttype = {arXiv},
  eprint    = {2302.00083},
  timestamp = {Thu, 09 Feb 2023 16:11:17 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-00083.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Retrieval-Augmented Language Model}
}

@inproceedings{DBLP:conf/emnlp/ShinRLWS20,
  author    = {Taylor Shin and
               Yasaman Razeghi and
               Logan IV, Robert L. and
               Eric Wallace and
               Sameer Singh},
  editor    = {Bonnie Webber and
               Trevor Cohn and
               Yulan He and
               Yang Liu},
  title     = {{AutoPrompt}: Eliciting Knowledge from Language Models with Automatically
               Generated Prompts},
  booktitle = {EMNLP},
  pages     = {4222--4235},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.346},
  doi       = {10.18653/v1/2020.emnlp-main.346},
  timestamp = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ShinRLWS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Language Model as Knowledge Base}
}

@article{DBLP:journals/tacl/RogersKR20,
  author    = {Anna Rogers and
               Olga Kovaleva and
               Anna Rumshisky},
  title     = {A Primer in {BERTology}: What We Know About How {BERT} Works},
  journal   = {TACL},
  volume    = {8},
  pages     = {842--866},
  year      = {2020},
  url       = {https://doi.org/10.1162/tacl\_a\_00349},
  doi       = {10.1162/tacl\_a\_00349},
  timestamp = {Fri, 10 Jun 2022 10:35:17 +0200},
  biburl    = {https://dblp.org/rec/journals/tacl/RogersKR20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Pre-Training Techniques}
}

@inproceedings{DBLP:conf/eacl/HeinzerlingI21,
  author     = {Benjamin Heinzerling and
                Kentaro Inui},
  editor     = {Paola Merlo and
                J{\"{o}}rg Tiedemann and
                Reut Tsarfaty},
  title      = {Language Models as Knowledge Bases: On Entity Representations, Storage
                Capacity, and Paraphrased Queries},
  booktitle  = {EACL},
  pages      = {1772--1791},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.eacl-main.153},
  url        = {https://doi.org/10.18653/v1/2021.eacl-main.153},
  keywords   = {Language Model as Knowledge Base},
  timestamp  = {Thu, 20 Jan 2022 10:02:49 +0100},
  biburl     = {https://dblp.org/rec/conf/eacl/HeinzerlingI21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/WangL00Z22,
  author    = {Chenhao Wang and
               Jiachun Li and
               Yubo Chen and
               Kang Liu and
               Jun Zhao},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {{CN-AutoMIC}: Distilling {Chinese} Commonsense Knowledge from Pretrained
               Language Models},
  booktitle = {EMNLP},
  pages     = {9253--9265},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.628},
  timestamp = {Fri, 03 Mar 2023 10:21:23 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/WangL00Z22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Distillation}
}

@article{DBLP:journals/corr/abs-2301-11293,
  author     = {Mehran Kazemi and
                Sid Mittal and
                Deepak Ramachandran},
  title      = {Understanding Finetuning for Factual Knowledge Extraction from Language
                Models},
  journal    = {CoRR},
  volume     = {abs/2301.11293},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.11293},
  url        = {https://doi.org/10.48550/arXiv.2301.11293},
  eprinttype = {arXiv},
  eprint     = {2301.11293},
  keywords   = {Language Model as Knowledge Base, Knowledge Generation},
  timestamp  = {Tue, 31 Jan 2023 16:32:10 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-11293.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/acl/CaoLHL022,
  author     = {Boxi Cao and
                Hongyu Lin and
                Xianpei Han and
                Fangchao Liu and
                Le Sun},
  editor     = {Smaranda Muresan and
                Preslav Nakov and
                Aline Villavicencio},
  title      = {Can Prompt Probe Pretrained Language Models? Understanding the Invisible
                Risks from a Causal View},
  booktitle  = {ACL},
  pages      = {5796--5808},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.acl-long.398},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.398},
  keywords   = {Prompt Engineering},
  timestamp  = {Mon, 01 Aug 2022 16:27:39 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/CaoLHL022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2002-08909,
  author     = {Kelvin Guu and
                Kenton Lee and
                Zora Tung and
                Panupong Pasupat and
                Ming{-}Wei Chang},
  title      = {{REALM:} Retrieval-Augmented Language Model Pre-Training},
  journal    = {CoRR},
  volume     = {abs/2002.08909},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.08909},
  eprinttype = {arXiv},
  eprint     = {2002.08909},
  keywords   = {Retrieval-Augmented Language Model},
  timestamp  = {Mon, 02 Mar 2020 16:46:06 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-08909.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/nips/LewisPPPKGKLYR020,
  author     = {Patrick S. H. Lewis and
                Ethan Perez and
                Aleksandra Piktus and
                Fabio Petroni and
                Vladimir Karpukhin and
                Naman Goyal and
                Heinrich K{\"{u}}ttler and
                Mike Lewis and
                Wen{-}tau Yih and
                Tim Rockt{\"{a}}schel and
                Sebastian Riedel and
                Douwe Kiela},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Retrieval-Augmented Generation for Knowledge-Intensive {NLP} Tasks},
  booktitle  = {NeurIPS},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/6b493230205f780e1bc26945df7481e5-Abstract.html},
  keywords   = {Retrieval-Augmented Language Model},
  timestamp  = {Tue, 19 Jan 2021 15:57:07 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LewisPPPKGKLYR020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}


@inproceedings{DBLP:conf/emnlp/CaoAT21,
  author    = {De Cao, Nicola and
               Wilker Aziz and
               Ivan Titov},
  editor    = {Marie{-}Francine Moens and
               Xuanjing Huang and
               Lucia Specia and
               Scott Wen{-}tau Yih},
  title     = {Editing Factual Knowledge in Language Models},
  booktitle = {EMNLP},
  pages     = {6491--6506},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.emnlp-main.522},
  doi       = {10.18653/v1/2021.emnlp-main.522},
  timestamp = {Sun, 02 Oct 2022 16:00:24 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/CaoAT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Knowledge Editing}
}

@inproceedings{DBLP:conf/iclr/MitchellLBFM22,
  author     = {Eric Mitchell and
                Charles Lin and
                Antoine Bosselut and
                Chelsea Finn and
                Christopher D. Manning},
  title      = {Fast Model Editing at Scale},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=0DcZxeWfOPt},
  keywords   = {Knowledge Editing},
  timestamp  = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/MitchellLBFM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icml/MitchellLBMF22,
  author     = {Eric Mitchell and
                Charles Lin and
                Antoine Bosselut and
                Christopher D. Manning and
                Chelsea Finn},
  editor     = {Kamalika Chaudhuri and
                Stefanie Jegelka and
                Le Song and
                Csaba Szepesv{\'{a}}ri and
                Gang Niu and
                Sivan Sabato},
  title      = {Memory-Based Model Editing at Scale},
  booktitle  = {ICML},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {15817--15831},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/mitchell22a.html},
  keywords   = {Knowledge Editing},
  timestamp  = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/MitchellLBMF22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{meng2022locating,
  title={Locating and Editing Factual Associations in {GPT}},
  author={Meng, Kevin and Bau, David and Andonian, Alex J and Belinkov, Yonatan},
  booktitle={NeurIPS},
  year={2022},
  url={https://openreview.net/forum?id=-h6WAS6eE4},
  keywords={Knowledge Editing}
}

@article{DBLP:journals/corr/abs-2202-01110,
  author     = {Huayang Li and
                Yixuan Su and
                Deng Cai and
                Yan Wang and
                Lemao Liu},
  title      = {A Survey on Retrieval-Augmented Text Generation},
  journal    = {CoRR},
  volume     = {abs/2202.01110},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.01110},
  eprinttype = {arXiv},
  eprint     = {2202.01110},
  keywords   = {Survey, Retrieval-Augmented Language Model},
  timestamp  = {Wed, 09 Feb 2022 15:43:34 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-01110.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2211-12561,
  author     = {Michihiro Yasunaga and
                Armen Aghajanyan and
                Weijia Shi and
                Rich James and
                Jure Leskovec and
                Percy Liang and
                Mike Lewis and
                Luke Zettlemoyer and
                Wen{-}tau Yih},
  title      = {Retrieval-Augmented Multimodal Language Modeling},
  journal    = {CoRR},
  volume     = {abs/2211.12561},
  year       = {2022},
  doi        = {10.48550/arXiv.2211.12561},
  url        = {https://doi.org/10.48550/arXiv.2211.12561},
  eprinttype = {arXiv},
  eprint     = {2211.12561},
  keywords   = {Retrieval-Augmented Language Model, Multimodal},
  timestamp  = {Tue, 29 Nov 2022 17:41:18 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-12561.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{izacard2022atlas,
  title={Atlas: Few-shot Learning with Retrieval Augmented Language Models},
  author={Izacard, Gautier and Lewis, Patrick and Lomeli, Maria and Hosseini, Lucas and Petroni, Fabio and Schick, Timo and Dwivedi-Yu, Jane and Joulin, Armand and Riedel, Sebastian and Grave, Edouard},
  journal={CoRR},
  volume={abs/2208.03299},
  year={2022},
  url={https://arxiv.org/abs/2208.03299},
  eprinttype={arXiv},
  eprint={2208.03299},
  keywords={Retrieval-Augmented Language Model}
}

@article{DBLP:journals/corr/abs-2301-07094,
  author     = {Haotian Liu and
                Kilho Son and
                Jianwei Yang and
                Ce Liu and
                Jianfeng Gao and
                Yong Jae Lee and
                Chunyuan Li},
  title      = {Learning Customized Visual Models with Retrieval-Augmented Knowledge},
  journal    = {CoRR},
  volume     = {abs/2301.07094},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.07094},
  url        = {https://doi.org/10.48550/arXiv.2301.07094},
  eprinttype = {arXiv},
  eprint     = {2301.07094},
  keywords   = {Retrieval-Augmented Language Model, Multimodal},
  timestamp  = {Thu, 19 Jan 2023 15:40:01 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-07094.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2301-12652,
  author     = {Weijia Shi and
                Sewon Min and
                Michihiro Yasunaga and
                Minjoon Seo and
                Rich James and
                Mike Lewis and
                Luke Zettlemoyer and
                Wen{-}tau Yih},
  title      = {{REPLUG:} Retrieval-Augmented Black-Box Language Models},
  journal    = {CoRR},
  volume     = {abs/2301.12652},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.12652},
  url        = {https://doi.org/10.48550/arXiv.2301.12652},
  eprinttype = {arXiv},
  eprint     = {2301.12652},
  keywords   = {Retrieval-Augmented Language Model},
  timestamp  = {Wed, 01 Feb 2023 14:38:31 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-12652.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-04858,
  author    = {Zhuolin Yang and
               Wei Ping and
               Zihan Liu and
               Vijay Korthikanti and
               Weili Nie and
               De{-}An Huang and
               Linxi Fan and
               Zhiding Yu and
               Shiyi Lan and
               Bo Li and
               Ming{-}Yu Liu and
               Yuke Zhu and
               Mohammad Shoeybi and
               Bryan Catanzaro and
               Chaowei Xiao and
               Anima Anandkumar},
  title     = {{Re-ViLM}: Retrieval-Augmented Visual Language Model for Zero and Few-Shot
               Image Captioning},
  journal   = {CoRR},
  volume    = {abs/2302.04858},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2302.04858},
  doi       = {10.48550/arXiv.2302.04858},
  eprinttype = {arXiv},
  eprint    = {2302.04858},
  timestamp = {Mon, 13 Feb 2023 14:23:40 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2302-04858.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Retrieval-Augmented Language Model}
}

@inproceedings{DBLP:conf/emnlp/ZhongLC22,
  author     = {Zexuan Zhong and
                Tao Lei and
                Danqi Chen},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Training Language Models with Memory Augmentation},
  booktitle  = {EMNLP},
  pages      = {5657--5673},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.382},
  keywords   = {Retrieval-Augmented Language Model},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhongLC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icml/BorgeaudMHCRM0L22,
  author     = {Sebastian Borgeaud and
                Arthur Mensch and
                Jordan Hoffmann and
                Trevor Cai and
                Eliza Rutherford and
                Katie Millican and
                George van den Driessche and
                Jean{-}Baptiste Lespiau and
                Bogdan Damoc and
                Aidan Clark and
                Diego de Las Casas and
                Aurelia Guy and
                Jacob Menick and
                Roman Ring and
                Tom Hennigan and
                Saffron Huang and
                Loren Maggiore and
                Chris Jones and
                Albin Cassirer and
                Andy Brock and
                Michela Paganini and
                Geoffrey Irving and
                Oriol Vinyals and
                Simon Osindero and
                Karen Simonyan and
                Jack W. Rae and
                Erich Elsen and
                Laurent Sifre},
  editor     = {Kamalika Chaudhuri and
                Stefanie Jegelka and
                Le Song and
                Csaba Szepesv{\'{a}}ri and
                Gang Niu and
                Sivan Sabato},
  title      = {Improving Language Models by Retrieving from Trillions of Tokens},
  booktitle  = {ICML},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {2206--2240},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/borgeaud22a.html},
  keywords   = {Retrieval-Augmented Language Model},
  timestamp  = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/BorgeaudMHCRM0L22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2206-04624,
  author     = {Nayeon Lee and
                Wei Ping and
                Peng Xu and
                Mostofa Patwary and
                Mohammad Shoeybi and
                Bryan Catanzaro},
  title      = {Factuality Enhanced Language Models for Open-Ended Text Generation},
  journal    = {CoRR},
  volume     = {abs/2206.04624},
  year       = {2022},
  doi        = {10.48550/arXiv.2206.04624},
  url        = {https://doi.org/10.48550/arXiv.2206.04624},
  eprinttype = {arXiv},
  eprint     = {2206.04624},
  keywords   = {AIGC},
  timestamp  = {Wed, 15 Jun 2022 13:43:59 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-04624.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}


@inproceedings{DBLP:conf/emnlp/MadaanTCY22,
  author    = {Aman Madaan and
               Niket Tandon and
               Peter Clark and
               Yiming Yang},
  editor    = {Yoav Goldberg and
               Zornitsa Kozareva and
               Yue Zhang},
  title     = {Memory-assisted prompt editing to improve {GPT-3} after deployment},
  booktitle = {EMNLP},
  pages     = {2833--2861},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://aclanthology.org/2022.emnlp-main.183},
  timestamp = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/MadaanTCY22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Editing}
}

@article{DBLP:journals/corr/abs-2303-00046,
  author     = {Davis Brown and
                Charles Godfrey and
                Cody Nizinski and
                Jonathan Tu and
                Henry Kvinge},
  title      = {Robustness of edited neural networks},
  journal    = {CoRR},
  volume     = {abs/2303.00046},
  year       = {2023},
  doi        = {10.48550/arXiv.2303.00046},
  url        = {https://doi.org/10.48550/arXiv.2303.00046},
  eprinttype = {arXiv},
  eprint     = {2303.00046},
  keywords   = {Knowledge Editing},
  timestamp  = {Mon, 06 Mar 2023 16:51:26 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-00046.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2211-11031,
  author     = {Thomas Hartvigsen and
                Swami Sankaranarayanan and
                Hamid Palangi and
                Yoon Kim and
                Marzyeh Ghassemi},
  title      = {Aging with {GRACE:} Lifelong Model Editing with Discrete Key-Value
                Adaptors},
  journal    = {CoRR},
  volume     = {abs/2211.11031},
  year       = {2022},
  doi        = {10.48550/arXiv.2211.11031},
  url        = {https://doi.org/10.48550/arXiv.2211.11031},
  eprinttype = {arXiv},
  eprint     = {2211.11031},
  keywords   = {Knowledge Editing},
  timestamp  = {Thu, 24 Nov 2022 15:52:33 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-11031.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/emnlp/DongDSXSL22,
  author     = {Qingxiu Dong and
                Damai Dai and
                Yifan Song and
                Jingjing Xu and
                Zhifang Sui and
                Lei Li},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Calibrating Factual Knowledge in Pretrained Language Models},
  booktitle  = {EMNLP Findings},
  pages      = {5937--5947},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.438},
  keywords   = {Knowledge Generation},
  timestamp  = {Tue, 07 Feb 2023 17:10:52 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/DongDSXSL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}


@article{DBLP:journals/corr/abs-2301-09785,
  author    = {Zeyu Huang and
               Yikang Shen and
               Xiaofeng Zhang and
               Jie Zhou and
               Wenge Rong and
               Zhang Xiong},
  title     = {{Transformer-Patcher}: One Mistake worth One Neuron},
  journal   = {CoRR},
  volume    = {abs/2301.09785},
  year      = {2023},
  url       = {https://doi.org/10.48550/arXiv.2301.09785},
  doi       = {10.48550/arXiv.2301.09785},
  eprinttype = {arXiv},
  eprint    = {2301.09785},
  timestamp = {Thu, 26 Jan 2023 15:26:31 +0100},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2301-09785.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Editing}
}

@inproceedings{DBLP:conf/emnlp/ZhaoZXZ022,
  author     = {Ruilin Zhao and
                Feng Zhao and
                Guandong Xu and
                Sixiao Zhang and
                Hai Jin},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Can Language Models Serve as Temporal Knowledge Bases?},
  booktitle  = {EMNLP Findings},
  pages      = {2024--2037},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.147},
  keywords   = {Language Model as Knowledge Base},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhaoZXZ022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/kdd/LiuZSCQZ0DT22,
  author     = {Xiao Liu and
                Shiyu Zhao and
                Kai Su and
                Yukuo Cen and
                Jiezhong Qiu and
                Mengdi Zhang and
                Wei Wu and
                Yuxiao Dong and
                Jie Tang},
  editor     = {Aidong Zhang and
                Huzefa Rangwala},
  title      = {Mask and Reason: Pre-Training Knowledge Graph Transformers for Complex
                Logical Queries},
  booktitle  = {KDD},
  pages      = {1120--1130},
  publisher  = {{ACM}},
  year       = {2022},
  doi        = {10.1145/3534678.3539472},
  url        = {https://doi.org/10.1145/3534678.3539472},
  keywords   = {Question Answering},
  timestamp  = {Thu, 19 Jan 2023 15:08:26 +0100},
  biburl     = {https://dblp.org/rec/conf/kdd/LiuZSCQZ0DT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/acl/SaxenaKG22,
  author     = {Apoorv Saxena and
                Adrian Kochsiek and
                Rainer Gemulla},
  editor     = {Smaranda Muresan and
                Preslav Nakov and
                Aline Villavicencio},
  title      = {Sequence-to-Sequence Knowledge Graph Completion and Question Answering},
  booktitle  = {ACL},
  pages      = {2814--2828},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  doi        = {10.18653/v1/2022.acl-long.201},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.201},
  keywords   = {Question Answering},
  timestamp  = {Mon, 01 Aug 2022 16:27:41 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/SaxenaKG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/acl/00020FYWX0022,
  author    = {Wenhao Yu and
               Chenguang Zhu and
               Yuwei Fang and
               Donghan Yu and
               Shuohang Wang and
               Yichong Xu and
               Michael Zeng and
               Meng Jiang},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {{Dict-BERT}: Enhancing Language Model Pre-training with Dictionary},
  booktitle = {ACL Findings},
  pages     = {1907--1918},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.findings-acl.150},
  doi       = {10.18653/v1/2022.findings-acl.150},
  timestamp = {Mon, 01 Aug 2022 16:27:43 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/00020FYWX0022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Enhanced}
}


@inproceedings{DBLP:conf/emnlp/SafaviK21,
  author     = {Tara Safavi and
                Danai Koutra},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {Relational World Knowledge Representation in Contextual Language Models:
                {A} Review},
  booktitle  = {EMNLP},
  pages      = {1053--1067},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  doi        = {10.18653/v1/2021.emnlp-main.81},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.81},
  keywords   = {Survey},
  timestamp  = {Thu, 20 Jan 2022 10:02:10 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/SafaviK21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2210-08901,
  author     = {Xuran Pan and
                Tianzhu Ye and
                Dongchen Han and
                Shiji Song and
                Gao Huang},
  title      = {Contrastive Language-Image Pre-Training with Knowledge Graphs},
  journal    = {CoRR},
  volume     = {abs/2210.08901},
  year       = {2022},
  doi        = {10.48550/arXiv.2210.08901},
  url        = {https://doi.org/10.48550/arXiv.2210.08901},
  eprinttype = {arXiv},
  eprint     = {2210.08901},
  keywords   = {Multimodal},
  timestamp  = {Wed, 19 Oct 2022 12:47:31 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-08901.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{wu2023visual,
  title={Visual {ChatGPT}: Talking, Drawing and Editing with Visual Foundation Models},
  author={Wu, Chenfei and Yin, Shengming and Qi, Weizhen and Wang, Xiaodong and Tang, Zecheng and Duan, Nan},
  journal={CoRR},
  volume={abs/2303.04671},
  year={2023},
  url={https://arxiv.org/abs/2303.04671},
  eprinttype={arXiv},
  eprint={2303.04671},
  keywords={Multimodal}
}

@article{DBLP:journals/corr/abs-2301-11916,
  author     = {Xinyi Wang and
                Wanrong Zhu and
                William Yang Wang},
  title      = {Large Language Models Are Implicitly Topic Models: Explaining and
                Finding Good Demonstrations for In-Context Learning},
  journal    = {CoRR},
  volume     = {abs/2301.11916},
  year       = {2023},
  doi        = {10.48550/arXiv.2301.11916},
  url        = {https://doi.org/10.48550/arXiv.2301.11916},
  eprinttype = {arXiv},
  eprint     = {2301.11916},
  keywords   = {In-Context Learning},
  timestamp  = {Tue, 31 Jan 2023 16:32:10 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-11916.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{imani2023mathprompter,
  title={{MathPrompter}: Mathematical Reasoning using Large Language Models},
  author={Imani, Shima and Du, Liang and Shrivastava, Harsh},
  journal={CoRR},
  volume={abs/2303.05398},
  year={2023},
  url={https://arxiv.org/abs/2303.05398},
  eprinttype={arXiv},
  eprint={2303.05398},
  keywords={Reasoning}
}

@inproceedings{DBLP:conf/iclr/NewmanCR22,
  author    = {Benjamin Newman and
               Prafulla Kumar Choubey and
               Nazneen Rajani},
  title     = {{P-Adapters}: Robustly Extracting Factual Information from Language
               Models with Diverse Prompts},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=DhzIU48OcZh},
  timestamp = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/NewmanCR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Generation}
}

@inproceedings{DBLP:conf/acl/MilewskiLM22,
  author    = {Victor Milewski and
               Miryam de Lhoneux and
               Marie{-}Francine Moens},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Finding Structural Knowledge in {Multimodal-BERT}},
  booktitle = {ACL},
  pages     = {5658--5671},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.acl-long.388},
  doi       = {10.18653/v1/2022.acl-long.388},
  timestamp = {Wed, 07 Dec 2022 23:10:02 +0100},
  biburl    = {https://dblp.org/rec/conf/acl/MilewskiLM22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Language Model as Knowledge Base}
}


@article{openai2023technical,
  title={{GPT-4} Technical Report},
  author={{OpenAI}},
  url = {https://cdn.openai.com/papers/gpt-4.pdf},
  year = {2023},
  booktitle = {OpenAI},
  keywords = {AIGC, Natural Language Understanding, Pre-Training Techniques},
  plm={GPT-4}
}

@article{openai2023system,
  title={{GPT-4} System Card},
  author={{OpenAI}},
  url = {https://cdn.openai.com/papers/gpt-4-system-card.pdf},
  year = {2023},
  booktitle = {OpenAI},
  keywords = {AIGC, Natural Language Understanding, Pre-Training Techniques},
  plm={GPT-4}
}

@inproceedings{DBLP:conf/iclr/0001BYRLML22,
  author    = {Xikun Zhang and
               Antoine Bosselut and
               Michihiro Yasunaga and
               Hongyu Ren and
               Percy Liang and
               Christopher D. Manning and
               Jure Leskovec},
  title     = {{GreaseLM}: Graph {REASoning} Enhanced Language Models},
  booktitle = {ICLR},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=41e9o6cQPj},
  timestamp = {Sat, 20 Aug 2022 01:15:42 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/0001BYRLML22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Knowledge Enhanced}
}

@article{DBLP:journals/corr/abs-2302-07842,
  author     = {Gr{\'{e}}goire Mialon and
                Roberto Dess{\`{\i}} and
                Maria Lomeli and
                Christoforos Nalmpantis and
                Ramakanth Pasunuru and
                Roberta Raileanu and
                Baptiste Rozi{\`{e}}re and
                Timo Schick and
                Jane Dwivedi{-}Yu and
                Asli Celikyilmaz and
                Edouard Grave and
                Yann LeCun and
                Thomas Scialom},
  title      = {Augmented Language Models: a Survey},
  journal    = {CoRR},
  volume     = {abs/2302.07842},
  year       = {2023},
  doi        = {10.48550/arXiv.2302.07842},
  url        = {https://doi.org/10.48550/arXiv.2302.07842},
  eprinttype = {arXiv},
  eprint     = {2302.07842},
  keywords   = {Survey},
  timestamp  = {Mon, 20 Feb 2023 14:27:28 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-07842.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/acl/KhashabiBCH22,
  author    = {Daniel Khashabi and
               Chitta Baral and
               Yejin Choi and
               Hannaneh Hajishirzi},
  editor    = {Smaranda Muresan and
               Preslav Nakov and
               Aline Villavicencio},
  title     = {Reframing Instructional Prompts to {GPTk's} Language},
  booktitle = {ACL Findings},
  pages     = {589--612},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.findings-acl.50},
  doi       = {10.18653/v1/2022.findings-acl.50},
  timestamp = {Mon, 01 Aug 2022 16:27:50 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/KhashabiBCH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords={Prompt Engineering}
}

@inproceedings{DBLP:conf/acl/0010LLWWBCH22,
  author     = {Jiacheng Liu and
                Alisa Liu and
                Ximing Lu and
                Sean Welleck and
                Peter West and
                Le Bras, Ronan and
                Yejin Choi and
                Hannaneh Hajishirzi},
  editor     = {Smaranda Muresan and
                Preslav Nakov and
                Aline Villavicencio},
  title      = {Generated Knowledge Prompting for Commonsense Reasoning},
  booktitle  = {ACL},
  pages      = {3154--3169},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.225},
  doi        = {10.18653/v1/2022.acl-long.225},
  timestamp  = {Mon, 05 Dec 2022 16:59:59 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/0010LLWWBCH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@inproceedings{DBLP:conf/emnlp/0010HLHWHC22,
  author     = {Jiacheng Liu and
                Skyler Hallinan and
                Ximing Lu and
                Pengfei He and
                Sean Welleck and
                Hannaneh Hajishirzi and
                Yejin Choi},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Rainier: Reinforced Knowledge Introspector for Commonsense Question
                Answering},
  booktitle  = {EMNLP},
  pages      = {8938--8958},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.611},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/0010HLHWHC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@inproceedings{DBLP:conf/naacl/WestBHHJBLWC22,
  author     = {Peter West and
                Chandra Bhagavatula and
                Jack Hessel and
                Jena D. Hwang and
                Liwei Jiang and
                Le Bras, Ronan and
                Ximing Lu and
                Sean Welleck and
                Yejin Choi},
  editor     = {Marine Carpuat and
                Marie{-}Catherine de Marneffe and
                Meza Ru{\'{\i}}z, Iv{\'{a}}n Vladimir},
  title      = {Symbolic Knowledge Distillation: from General Language Models to Commonsense
                Models},
  booktitle  = {NAACL},
  pages      = {4602--4625},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.naacl-main.341},
  doi        = {10.18653/v1/2022.naacl-main.341},
  timestamp  = {Mon, 05 Dec 2022 16:59:59 +0100},
  biburl     = {https://dblp.org/rec/conf/naacl/WestBHHJBLWC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@article{DBLP:journals/corr/abs-2212-09246,
  author     = {Chandra Bhagavatula and
                Jena D. Hwang and
                Doug Downey and
                Le Bras, Ronan and
                Ximing Lu and
                Keisuke Sakaguchi and
                Swabha Swayamdipta and
                Peter West and
                Yejin Choi},
  title      = {{I2D2:} Inductive Knowledge Distillation with {NeuroLogic} and Self-Imitation},
  journal    = {CoRR},
  volume     = {abs/2212.09246},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.09246},
  doi        = {10.48550/arXiv.2212.09246},
  eprinttype = {arXiv},
  eprint     = {2212.09246},
  timestamp  = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-09246.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@article{DBLP:journals/corr/abs-2207-13332,
  author     = {Jungo Kasai and
                Keisuke Sakaguchi and
                Yoichi Takahashi and
                Le Bras, Ronan and
                Akari Asai and
                Xinyan Yu and
                Dragomir R. Radev and
                Noah A. Smith and
                Yejin Choi and
                Kentaro Inui},
  title      = {{RealTime} {QA:} What's the Answer Right Now?},
  journal    = {CoRR},
  volume     = {abs/2207.13332},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.13332},
  doi        = {10.48550/arXiv.2207.13332},
  eprinttype = {arXiv},
  eprint     = {2207.13332},
  timestamp  = {Mon, 05 Dec 2022 16:59:59 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-13332.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Question Answering}
}

@inproceedings{DBLP:conf/acl/ZellersHBFC19,
  author     = {Rowan Zellers and
                Ari Holtzman and
                Yonatan Bisk and
                Ali Farhadi and
                Yejin Choi},
  editor     = {Anna Korhonen and
                David R. Traum and
                Llu{\'{\i}}s M{\`{a}}rquez},
  title      = {{HellaSwag:} Can a Machine Really Finish Your Sentence?},
  booktitle  = {ACL},
  pages      = {4791--4800},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  url        = {https://doi.org/10.18653/v1/p19-1472},
  doi        = {10.18653/v1/p19-1472},
  timestamp  = {Fri, 06 Aug 2021 00:41:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ZellersHBFC19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Others},
  code       = {https://rowanzellers.com/hellaswag}
}

@article{DBLP:journals/corr/abs-2211-00053,
  author     = {Sean Welleck and
                Ximing Lu and
                Peter West and
                Faeze Brahman and
                Tianxiao Shen and
                Daniel Khashabi and
                Yejin Choi},
  title      = {Generating Sequences by Learning to Self-Correct},
  journal    = {CoRR},
  volume     = {abs/2211.00053},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.00053},
  doi        = {10.48550/arXiv.2211.00053},
  eprinttype = {arXiv},
  eprint     = {2211.00053},
  timestamp  = {Fri, 04 Nov 2022 13:48:49 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-00053.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Quality}
}

@article{DBLP:journals/corr/abs-2210-01241,
  author     = {Rajkumar Ramamurthy and
                Prithviraj Ammanabrolu and
                Kiant{\'{e}} Brantley and
                Jack Hessel and
                Rafet Sifa and
                Christian Bauckhage and
                Hannaneh Hajishirzi and
                Yejin Choi},
  title      = {Is Reinforcement Learning (Not) for Natural Language Processing?:
                Benchmarks, Baselines, and Building Blocks for Natural Language Policy
                Optimization},
  journal    = {CoRR},
  volume     = {abs/2210.01241},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.01241},
  doi        = {10.48550/arXiv.2210.01241},
  eprinttype = {arXiv},
  eprint     = {2210.01241},
  timestamp  = {Fri, 07 Oct 2022 15:24:59 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-01241.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2205-13636,
  author     = {Ximing Lu and
                Sean Welleck and
                Liwei Jiang and
                Jack Hessel and
                Lianhui Qin and
                Peter West and
                Prithviraj Ammanabrolu and
                Yejin Choi},
  title      = {Quark: Controllable Text Generation with Reinforced Unlearning},
  journal    = {CoRR},
  volume     = {abs/2205.13636},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.13636},
  doi        = {10.48550/arXiv.2205.13636},
  eprinttype = {arXiv},
  eprint     = {2205.13636},
  timestamp  = {Tue, 31 May 2022 15:14:51 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-13636.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Controllable Text Generation}
}

@inproceedings{DBLP:conf/emnlp/ZhouKLLHPR21,
  author     = {Pei Zhou and
                Rahul Khanna and
                Seyeon Lee and
                Bill Yuchen Lin and
                Daniel Ho and
                Jay Pujara and
                Xiang Ren},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {{RICA:} Evaluating Robust Inference Capabilities Based on Commonsense
                Axioms},
  booktitle  = {EMNLP},
  pages      = {7560--7579},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.598},
  doi        = {10.18653/v1/2021.emnlp-main.598},
  timestamp  = {Thu, 20 Jan 2022 10:02:20 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhouKLLHPR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation}
}

@inproceedings{DBLP:conf/emnlp/YinBMLC22,
  author     = {Da Yin and
                Hritik Bansal and
                Masoud Monajatipoor and
                Liunian Harold Li and
                Kai{-}Wei Chang},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {{GeoMLAMA:} Geo-Diverse Commonsense Probing on Multilingual Pre-Trained
                Language Models},
  booktitle  = {EMNLP},
  pages      = {2039--2055},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.132},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/YinBMLC22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multilingual, Evaluation}
}

@inproceedings{DBLP:conf/emnlp/0001L022,
  author     = {Soumya Sanyal and
                Zeyi Liao and
                Xiang Ren},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {{RobustLR:} {A} Diagnostic Benchmark for Evaluating Logical Robustness
                of Deductive Reasoners},
  booktitle  = {EMNLP},
  pages      = {9614--9631},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.653},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/0001L022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation, Reasoning}
}

@inproceedings{DBLP:conf/acl/ChoiCL22a,
  author     = {Dongha Choi and
                Hongseok Choi and
                Hyunju Lee},
  editor     = {Smaranda Muresan and
                Preslav Nakov and
                Aline Villavicencio},
  title      = {Domain Knowledge Transferring for Pre-trained Language Model via Calibrated
                Activation Boundary Distillation},
  booktitle  = {ACL},
  pages      = {1658--1669},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.116},
  doi        = {10.18653/v1/2022.acl-long.116},
  timestamp  = {Mon, 01 Aug 2022 16:27:48 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChoiCL22a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Distillation}
}

@inproceedings{DBLP:conf/aaai/Bhargava022,
  author     = {Prajjwal Bhargava and
                Vincent Ng},
  title      = {Commonsense Knowledge Reasoning and Generation with Pre-trained Language
                Models: {A} Survey},
  booktitle  = {AAAI},
  pages      = {12317--12325},
  publisher  = {{AAAI} Press},
  year       = {2022},
  url        = {https://ojs.aaai.org/index.php/AAAI/article/view/21496},
  timestamp  = {Tue, 12 Jul 2022 14:14:21 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/Bhargava022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}

@inproceedings{DBLP:conf/iclr/ZhouLSL021,
  author     = {Wangchunshu Zhou and
                Dong{-}Ho Lee and
                Ravi Kiran Selvam and
                Seyeon Lee and
                Xiang Ren},
  title      = {Pre-training Text-to-Text Transformers for Concept-centric Common
                Sense},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=3k20LAiHYL2},
  timestamp  = {Wed, 23 Jun 2021 17:36:40 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ZhouLSL021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Controllable Text Generation}
}

@inproceedings{DBLP:conf/emnlp/LinZSZBCR20,
  author     = {Bill Yuchen Lin and
                Wangchunshu Zhou and
                Ming Shen and
                Pei Zhou and
                Chandra Bhagavatula and
                Yejin Choi and
                Xiang Ren},
  editor     = {Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {{CommonGen:} {A} Constrained Text Generation Challenge for Generative
                Commonsense Reasoning},
  booktitle  = {EMNLP Findings},
  series     = {Findings of {ACL}},
  volume     = {{EMNLP} 2020},
  pages      = {1823--1840},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.findings-emnlp.165},
  doi        = {10.18653/v1/2020.findings-emnlp.165},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/LinZSZBCR20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Controllable Text Generation}
}

@inproceedings{DBLP:conf/acl/0003W0D020,
  author     = {Yufei Wang and
                Ian D. Wood and
                Stephen Wan and
                Mark Dras and
                Mark Johnson},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Mention Flags {(MF):} Constraining Transformer-based Text Generators},
  booktitle  = {ACL},
  pages      = {103--113},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.9},
  doi        = {10.18653/v1/2021.acl-long.9},
  timestamp  = {Sat, 09 Apr 2022 12:33:45 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/0003W0D020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Controllable Text Generation}
}

@article{DBLP:journals/corr/abs-2209-10372,
  author     = {Hui Su and
                Xiao Zhou and
                Houjin Yu and
                Yuwen Chen and
                Zilin Zhu and
                Yang Yu and
                Jie Zhou},
  title      = {{WeLM:} {A} Well-Read Pre-trained Language Model for {Chinese}},
  journal    = {CoRR},
  volume     = {abs/2209.10372},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.10372},
  doi        = {10.48550/arXiv.2209.10372},
  eprinttype = {arXiv},
  eprint     = {2209.10372},
  timestamp  = {Wed, 05 Oct 2022 08:25:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-10372.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Pre-Training Techniques},
  code       = {https://welm.weixin.qq.com/docs/api/}
}

@inproceedings{DBLP:conf/acl/ParanjapeMGHZ21,
  author     = {Bhargavi Paranjape and
                Julian Michael and
                Marjan Ghazvininejad and
                Hannaneh Hajishirzi and
                Luke Zettlemoyer},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Prompting Contrastive Explanations for Commonsense Reasoning Tasks},
  booktitle  = {ACL Findings},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {4179--4192},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.366},
  doi        = {10.18653/v1/2021.findings-acl.366},
  timestamp  = {Fri, 27 Aug 2021 08:39:19 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ParanjapeMGHZ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Interpretability/Explainability}
}

@inproceedings{DBLP:conf/nips/ChristianoLBMLA17,
  author     = {Paul F. Christiano and
                Jan Leike and
                Tom B. Brown and
                Miljan Martic and
                Shane Legg and
                Dario Amodei},
  editor     = {Isabelle Guyon and
                Ulrike von Luxburg and
                Samy Bengio and
                Hanna M. Wallach and
                Rob Fergus and
                S. V. N. Vishwanathan and
                Roman Garnett},
  title      = {Deep Reinforcement Learning from Human Preferences},
  booktitle  = {NeurIPS},
  pages      = {4299--4307},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/d5e2c0adad503c91f91df240d0cd4e49-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 15:15:21 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ChristianoLBMLA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-1909-08593,
  author     = {Daniel M. Ziegler and
                Nisan Stiennon and
                Jeffrey Wu and
                Tom B. Brown and
                Alec Radford and
                Dario Amodei and
                Paul F. Christiano and
                Geoffrey Irving},
  title      = {Fine-Tuning Language Models from Human Preferences},
  journal    = {CoRR},
  volume     = {abs/1909.08593},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.08593},
  eprinttype = {arXiv},
  eprint     = {1909.08593},
  timestamp  = {Thu, 01 Apr 2021 19:06:51 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-08593.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2112-09332,
  author     = {Reiichiro Nakano and
                Jacob Hilton and
                Suchir Balaji and
                Jeff Wu and
                Long Ouyang and
                Christina Kim and
                Christopher Hesse and
                Shantanu Jain and
                Vineet Kosaraju and
                William Saunders and
                Xu Jiang and
                Karl Cobbe and
                Tyna Eloundou and
                Gretchen Krueger and
                Kevin Button and
                Matthew Knight and
                Benjamin Chess and
                John Schulman},
  title      = {{WebGPT:} Browser-assisted question-answering with human feedback},
  journal    = {CoRR},
  volume     = {abs/2112.09332},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.09332},
  eprinttype = {arXiv},
  eprint     = {2112.09332},
  timestamp  = {Mon, 03 Jan 2022 15:45:35 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-09332.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2203-11147,
  author     = {Jacob Menick and
                Maja Trebacz and
                Vladimir Mikulik and
                John Aslanides and
                H. Francis Song and
                Martin Chadwick and
                Mia Glaese and
                Susannah Young and
                Lucy Campbell{-}Gillingham and
                Geoffrey Irving and
                Nat McAleese},
  title      = {Teaching language models to support answers with verified quotes},
  journal    = {CoRR},
  volume     = {abs/2203.11147},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.11147},
  doi        = {10.48550/arXiv.2203.11147},
  eprinttype = {arXiv},
  eprint     = {2203.11147},
  timestamp  = {Tue, 29 Mar 2022 18:07:24 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-11147.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@inproceedings{DBLP:conf/nips/StiennonO0ZLVRA20,
  author     = {Nisan Stiennon and
                Long Ouyang and
                Jeffrey Wu and
                Daniel M. Ziegler and
                Ryan Lowe and
                Chelsea Voss and
                Alec Radford and
                Dario Amodei and
                Paul F. Christiano},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Learning to summarize with human feedback},
  booktitle  = {NeurIPS},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/1f89885d556929e98d3ef9b86448f951-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 15:57:45 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/StiennonO0ZLVRA20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2109-10862,
  author     = {Jeff Wu and
                Long Ouyang and
                Daniel M. Ziegler and
                Nisan Stiennon and
                Ryan Lowe and
                Jan Leike and
                Paul F. Christiano},
  title      = {Recursively Summarizing Books with Human Feedback},
  journal    = {CoRR},
  volume     = {abs/2109.10862},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.10862},
  eprinttype = {arXiv},
  eprint     = {2109.10862},
  timestamp  = {Mon, 04 Oct 2021 08:57:17 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-10862.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2209-14375,
  author     = {Amelia Glaese and
                Nat McAleese and
                Maja Trebacz and
                John Aslanides and
                Vlad Firoiu and
                Timo Ewalds and
                Maribeth Rauh and
                Laura Weidinger and
                Martin Chadwick and
                Phoebe Thacker and
                Lucy Campbell{-}Gillingham and
                Jonathan Uesato and
                Po{-}Sen Huang and
                Ramona Comanescu and
                Fan Yang and
                Abigail See and
                Sumanth Dathathri and
                Rory Greig and
                Charlie Chen and
                Doug Fritz and
                Jaume Sanchez Elias and
                Richard Green and
                Sona Mokr{\'{a}} and
                Nicholas Fernando and
                Boxi Wu and
                Rachel Foley and
                Susannah Young and
                Iason Gabriel and
                William Isaac and
                John Mellor and
                Demis Hassabis and
                Koray Kavukcuoglu and
                Lisa Anne Hendricks and
                Geoffrey Irving},
  title      = {Improving alignment of dialogue agents via targeted human judgements},
  journal    = {CoRR},
  volume     = {abs/2209.14375},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.14375},
  doi        = {10.48550/arXiv.2209.14375},
  eprinttype = {arXiv},
  eprint     = {2209.14375},
  timestamp  = {Thu, 06 Oct 2022 14:41:30 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-14375.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{gao2022scaling,
  author     = {Gao, Leo and Schulman, John and Hilton, Jacob},
  title      = {Scaling Laws for Reward Model Overoptimization},
  journal    = {CoRR},
  volume     = {abs/2210.10760},
  year       = {2022},
  url        = {https://arxiv.org/abs/2210.10760},
  doi        = {10.48550/arXiv.2210.10760},
  eprinttype = {arXiv},
  eprint     = {2210.10760},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2209-07858,
  author     = {Deep Ganguli and
                Liane Lovitt and
                Jackson Kernion and
                Amanda Askell and
                Yuntao Bai and
                Saurav Kadavath and
                Ben Mann and
                Ethan Perez and
                Nicholas Schiefer and
                Kamal Ndousse and
                Andy Jones and
                Sam Bowman and
                Anna Chen and
                Tom Conerly and
                Nova DasSarma and
                Dawn Drain and
                Nelson Elhage and
                Sheer El Showk and
                Stanislav Fort and
                Zac Hatfield{-}Dodds and
                Tom Henighan and
                Danny Hernandez and
                Tristan Hume and
                Josh Jacobson and
                Scott Johnston and
                Shauna Kravec and
                Catherine Olsson and
                Sam Ringer and
                Eli Tran{-}Johnson and
                Dario Amodei and
                Tom Brown and
                Nicholas Joseph and
                Sam McCandlish and
                Chris Olah and
                Jared Kaplan and
                Jack Clark},
  title      = {Red Teaming Language Models to Reduce Harms: Methods, Scaling Behaviors,
                and Lessons Learned},
  journal    = {CoRR},
  volume     = {abs/2209.07858},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.07858},
  doi        = {10.48550/arXiv.2209.07858},
  eprinttype = {arXiv},
  eprint     = {2209.07858},
  timestamp  = {Tue, 27 Sep 2022 16:29:43 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-07858.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2208-02294,
  author     = {Deborah Cohen and
                Moonkyung Ryu and
                Yinlam Chow and
                Orgad Keller and
                Ido Greenberg and
                Avinatan Hassidim and
                Michael Fink and
                Yossi Matias and
                Idan Szpektor and
                Craig Boutilier and
                Gal Elidan},
  title      = {Dynamic Planning in Open-Ended Dialogue using Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2208.02294},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.02294},
  doi        = {10.48550/arXiv.2208.02294},
  eprinttype = {arXiv},
  eprint     = {2208.02294},
  timestamp  = {Tue, 09 Aug 2022 17:15:58 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-02294.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2203-02155,
  author     = {Long Ouyang and
                Jeff Wu and
                Xu Jiang and
                Diogo Almeida and
                Carroll L. Wainwright and
                Pamela Mishkin and
                Chong Zhang and
                Sandhini Agarwal and
                Katarina Slama and
                Alex Ray and
                John Schulman and
                Jacob Hilton and
                Fraser Kelton and
                Luke Miller and
                Maddie Simens and
                Amanda Askell and
                Peter Welinder and
                Paul F. Christiano and
                Jan Leike and
                Ryan Lowe},
  title      = {Training language models to follow instructions with human feedback},
  journal    = {CoRR},
  volume     = {abs/2203.02155},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.02155},
  doi        = {10.48550/arXiv.2203.02155},
  eprinttype = {arXiv},
  eprint     = {2203.02155},
  timestamp  = {Wed, 16 Mar 2022 16:39:52 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-02155.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@inproceedings{DBLP:conf/emnlp/GaoZGBD20,
  author     = {Xiang Gao and
                Yizhe Zhang and
                Michel Galley and
                Chris Brockett and
                Bill Dolan},
  editor     = {Bonnie Webber and
                Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {Dialogue Response Ranking Training with Large-Scale Human Feedback
                Data},
  booktitle  = {EMNLP},
  pages      = {386--395},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.28},
  doi        = {10.18653/v1/2020.emnlp-main.28},
  timestamp  = {Fri, 24 Feb 2023 08:34:15 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/GaoZGBD20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/ijrr/BiyikLPLSS22,
  author     = {Erdem Biyik and
                Dylan P. Losey and
                Malayandi Palan and
                Nicholas C. Landolfi and
                Gleb Shevchuk and
                Dorsa Sadigh},
  title      = {Learning reward functions from diverse sources of human feedback:
                Optimally integrating demonstrations and preferences},
  journal    = {IJRR},
  volume     = {41},
  number     = {1},
  pages      = {45--67},
  year       = {2022},
  url        = {https://doi.org/10.1177/02783649211041652},
  doi        = {10.1177/02783649211041652},
  timestamp  = {Mon, 25 Jul 2022 08:39:40 +0200},
  biburl     = {https://dblp.org/rec/journals/ijrr/BiyikLPLSS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{DBLP:journals/corr/abs-2302-12192,
  author     = {Kimin Lee and
                Hao Liu and
                Moonkyung Ryu and
                Olivia Watkins and
                Yuqing Du and
                Craig Boutilier and
                Pieter Abbeel and
                Mohammad Ghavamzadeh and
                Shixiang Shane Gu},
  title      = {Aligning Text-to-Image Models using Human Feedback},
  journal    = {CoRR},
  volume     = {abs/2302.12192},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.12192},
  doi        = {10.48550/arXiv.2302.12192},
  eprinttype = {arXiv},
  eprint     = {2302.12192},
  timestamp  = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-12192.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal, RLHF}
}

@article{DBLP:journals/corr/abs-2212-10539,
  author     = {Weijia Shi and
                Xiaochuang Han and
                Hila Gonen and
                Ari Holtzman and
                Yulia Tsvetkov and
                Luke Zettlemoyer},
  title      = {Toward Human Readable Prompt Tuning: {Kubrick}'s {The Shining} is a good
                movie, and a good prompt too?},
  journal    = {CoRR},
  volume     = {abs/2212.10539},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10539},
  doi        = {10.48550/arXiv.2212.10539},
  eprinttype = {arXiv},
  eprint     = {2212.10539},
  timestamp  = {Wed, 04 Jan 2023 16:01:37 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10539.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering}
}

@article{DBLP:journals/corr/abs-2212-10375,
  author     = {Zhiyong Wu and
                Yaoxiang Wang and
                Jiacheng Ye and
                Lingpeng Kong},
  title      = {Self-adaptive In-context Learning},
  journal    = {CoRR},
  volume     = {abs/2212.10375},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10375},
  doi        = {10.48550/arXiv.2212.10375},
  eprinttype = {arXiv},
  eprint     = {2212.10375},
  timestamp  = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10375.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

@article{DBLP:journals/corr/abs-2203-09161,
  author     = {Ravsehaj Singh Puri and
                Swaroop Mishra and
                Mihir Parmar and
                Chitta Baral},
  title      = {How Many Data Samples is an Additional Instruction Worth?},
  journal    = {CoRR},
  volume     = {abs/2203.09161},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.09161},
  doi        = {10.48550/arXiv.2203.09161},
  eprinttype = {arXiv},
  eprint     = {2203.09161},
  timestamp  = {Mon, 28 Mar 2022 17:09:43 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-09161.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning},
}

@article{DBLP:journals/corr/abs-2303-07992,
  author     = {Yiming Tan and
                Dehai Min and
                Yu Li and
                Wenbo Li and
                Nan Hu and
                Yongrui Chen and
                Guilin Qi},
  title      = {Evaluation of {ChatGPT} as a Question Answering System for Answering
                Complex Questions},
  journal    = {CoRR},
  volume     = {abs/2303.07992},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.07992},
  doi        = {10.48550/arXiv.2303.07992},
  eprinttype = {arXiv},
  eprint     = {2303.07992},
  timestamp  = {Mon, 20 Mar 2023 15:23:19 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-07992.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation, Question Answering},
}

@article{DBLP:journals/corr/abs-2302-13539,
  author     = {Xiaonan Li and
                Xipeng Qiu},
  title      = {Finding Supporting Examples for In-Context Learning},
  journal    = {CoRR},
  volume     = {abs/2302.13539},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.13539},
  doi        = {10.48550/arXiv.2302.13539},
  eprinttype = {arXiv},
  eprint     = {2302.13539},
  timestamp  = {Tue, 28 Feb 2023 14:02:05 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-13539.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2212-10378,
  author     = {Ting{-}Yun Chang and
                Robin Jia},
  title      = {Careful Data Curation Stabilizes In-context Learning},
  journal    = {CoRR},
  volume     = {abs/2212.10378},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10378},
  doi        = {10.48550/arXiv.2212.10378},
  eprinttype = {arXiv},
  eprint     = {2212.10378},
  timestamp  = {Tue, 03 Jan 2023 15:59:43 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10378.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
}

@inproceedings{DBLP:conf/emnlp/Wang0LTQYSHG22,
  author     = {Jianing Wang and
                Chengyu Wang and
                Fuli Luo and
                Chuanqi Tan and
                Minghui Qiu and
                Fei Yang and
                Qiuhui Shi and
                Songfang Huang and
                Ming Gao},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Towards Unified Prompt Tuning for Few-shot Text Classification},
  booktitle  = {EMNLP Findings},
  pages      = {524--536},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.findings-emnlp.37},
  timestamp  = {Tue, 21 Mar 2023 20:56:04 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/Wang0LTQYSHG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2210-12587,
  author     = {Xiangyu Peng and
                Chen Xing and
                Prafulla Kumar Choubey and
                Chien{-}Sheng Wu and
                Caiming Xiong},
  title      = {Model ensemble instead of prompt fusion: a sample-specific knowledge
                transfer method for few-shot prompt tuning},
  journal    = {CoRR},
  volume     = {abs/2210.12587},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.12587},
  doi        = {10.48550/arXiv.2210.12587},
  eprinttype = {arXiv},
  eprint     = {2210.12587},
  timestamp  = {Fri, 28 Oct 2022 14:21:57 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-12587.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2212-09095,
  author     = {Hritik Bansal and
                Karthik Gopalakrishnan and
                Saket Dingliwal and
                Sravan Bodapati and
                Katrin Kirchhoff and
                Dan Roth},
  title      = {Rethinking the Role of Scale for In-Context Learning: An Interpretability-based
                Case Study at 66 Billion Scale},
  journal    = {CoRR},
  volume     = {abs/2212.09095},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.09095},
  doi        = {10.48550/arXiv.2212.09095},
  eprinttype = {arXiv},
  eprint     = {2212.09095},
  timestamp  = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-09095.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning, Interpretability/Explainability},
}

@inproceedings{DBLP:conf/acl/HendrycksLWDKS20,
  author     = {Dan Hendrycks and
                Xiaoyuan Liu and
                Eric Wallace and
                Adam Dziedzic and
                Rishabh Krishnan and
                Dawn Song},
  editor     = {Dan Jurafsky and
                Joyce Chai and
                Natalie Schluter and
                Joel R. Tetreault},
  title      = {Pretrained Transformers Improve Out-of-Distribution Robustness},
  booktitle  = {ACL},
  pages      = {2744--2751},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.244},
  doi        = {10.18653/v1/2020.acl-main.244},
  timestamp  = {Fri, 06 Aug 2021 00:40:57 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/HendrycksLWDKS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Robustness},
}

@article{DBLP:journals/corr/abs-2210-07663,
  author     = {Swaroop Mishra and
                Bhavdeep Singh Sachdeva and
                Chitta Baral},
  title      = {Pretrained Transformers Do not Always Improve Robustness},
  journal    = {CoRR},
  volume     = {abs/2210.07663},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.07663},
  doi        = {10.48550/arXiv.2210.07663},
  eprinttype = {arXiv},
  eprint     = {2210.07663},
  timestamp  = {Tue, 18 Oct 2022 15:06:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-07663.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Robustness},
}

@inproceedings{DBLP:conf/emnlp/RudingerSHBFBSC20,
  author     = {Rachel Rudinger and
                Vered Shwartz and
                Jena D. Hwang and
                Chandra Bhagavatula and
                Maxwell Forbes and
                Ronan Le Bras and
                Noah A. Smith and
                Yejin Choi},
  editor     = {Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {Thinking Like a Skeptic: Defeasible Inference in Natural Language},
  booktitle  = {EMNLP Findings},
  series     = {Findings of {ACL}},
  volume     = {{EMNLP} 2020},
  pages      = {4661--4675},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.findings-emnlp.418},
  doi        = {10.18653/v1/2020.findings-emnlp.418},
  timestamp  = {Mon, 05 Dec 2022 16:59:59 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/RudingerSHBFBSC20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Symbolic Reasoning},
}

@inproceedings{DBLP:conf/emnlp/SahaHRB22,
  author     = {Swarnadeep Saha and
                Peter Hase and
                Nazneen Rajani and
                Mohit Bansal},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Are Hard Examples also Harder to Explain? {A} Study with Human and
                Model-Generated Explanations},
  booktitle  = {EMNLP},
  pages      = {2121--2131},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.137},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/SahaHRB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Interpretability/Explainability},
}

@inproceedings{DBLP:conf/nips/Welleck0BHCCC21,
  author     = {Sean Welleck and
                Jiacheng Liu and
                Ronan Le Bras and
                Hanna Hajishirzi and
                Yejin Choi and
                Kyunghyun Cho},
  editor     = {Joaquin Vanschoren and
                Sai{-}Kit Yeung},
  title      = {{NaturalProofs}: Mathematical Theorem Proving in Natural Language},
  booktitle  = {NeurIPS},
  year       = {2021},
  url        = {https://datasets-benchmarks-proceedings.neurips.cc/paper/2021/hash/d9d4f495e875a2e075a1a4a6e1b9770f-Abstract-round1.html},
  timestamp  = {Mon, 05 Dec 2022 16:59:59 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Welleck0BHCCC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Arithmetic Reasoning},
}

@article{DBLP:journals/corr/abs-2206-14858,
  author     = {Aitor Lewkowycz and
                Anders Andreassen and
                David Dohan and
                Ethan Dyer and
                Henryk Michalewski and
                Vinay V. Ramasesh and
                Ambrose Slone and
                Cem Anil and
                Imanol Schlag and
                Theo Gutman{-}Solo and
                Yuhuai Wu and
                Behnam Neyshabur and
                Guy Gur{-}Ari and
                Vedant Misra},
  title      = {Solving Quantitative Reasoning Problems with Language Models},
  journal    = {CoRR},
  volume     = {abs/2206.14858},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.14858},
  doi        = {10.48550/arXiv.2206.14858},
  eprinttype = {arXiv},
  eprint     = {2206.14858},
  timestamp  = {Mon, 04 Jul 2022 16:22:19 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-14858.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Arithmetic Reasoning},
}

@inproceedings{DBLP:conf/emnlp/YeGLXF00K22,
  author     = {Jiacheng Ye and
                Jiahui Gao and
                Qintong Li and
                Hang Xu and
                Jiangtao Feng and
                Zhiyong Wu and
                Tao Yu and
                Lingpeng Kong},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {{ZeroGen}: Efficient Zero-shot Learning via Dataset Generation},
  booktitle  = {EMNLP},
  pages      = {11653--11669},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://aclanthology.org/2022.emnlp-main.801},
  timestamp  = {Tue, 07 Feb 2023 17:10:51 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/YeGLXF00K22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Data Generation},
}

@article{DBLP:journals/corr/abs-2202-04538,
  author     = {Yu Meng and
                Jiaxin Huang and
                Yu Zhang and
                Jiawei Han},
  title      = {Generating Training Data with Language Models: Towards Zero-Shot Language
                Understanding},
  journal    = {CoRR},
  volume     = {abs/2202.04538},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.04538},
  doi        = {10.48550/arXiv.2202.04538},
  eprinttype = {arXiv},
  eprint     = {2202.04538},
  timestamp  = {Wed, 02 Mar 2022 10:00:29 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-04538.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Data Generation, Natural Language Understanding},
}

@inproceedings{gaoself,
  author     = {Gao, Jiahui and
                Pi, Renjie and
                Lin, Yong and
                Xu, Hang and
                Ye, Jiacheng and
                Wu, Zhiyong and
                Zhang, Weizhong and
                Liang, Xiaodan and
                Li, Zhenguo and
                Kong, Lingpeng},
  title      = {Self-Guided Noise-Free Data Generation for Efficient Zero-Shot Learning},
  booktitle  = {ICLR},
  year       = {2023},
  url        = {https://openreview.net/forum?id=h5OpjGd_lo6},
  keywords   = {Data Generation},
}

@article{DBLP:journals/corr/abs-2303-01580,
  author     = {Derek Chen and
                Celine Lee and
                Yunan Lu and
                Domenic Rosati and
                Zhou Yu},
  title      = {Mixture of Soft Prompts for Controllable Data Generation},
  journal    = {CoRR},
  volume     = {abs/2303.01580},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.01580},
  doi        = {10.48550/arXiv.2303.01580},
  eprinttype = {arXiv},
  eprint     = {2303.01580},
  timestamp  = {Mon, 06 Mar 2023 16:51:26 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-01580.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {AIGC},
}

@article{DBLP:journals/corr/abs-2303-07895,
  author     = {Noam Wies and
                Yoav Levine and
                Amnon Shashua},
  title      = {The Learnability of In-Context Learning},
  journal    = {CoRR},
  volume     = {abs/2303.07895},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.07895},
  doi        = {10.48550/arXiv.2303.07895},
  eprinttype = {arXiv},
  eprint     = {2303.07895},
  timestamp  = {Mon, 20 Mar 2023 15:23:19 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-07895.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2303-07616,
  author     = {Boxi Cao and
                Hongyu Lin and
                Xianpei Han and
                Le Sun},
  title      = {The Life Cycle of Knowledge in Big Language Models: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2303.07616},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.07616},
  doi        = {10.48550/arXiv.2303.07616},
  eprinttype = {arXiv},
  eprint     = {2303.07616},
  timestamp  = {Mon, 20 Mar 2023 15:23:19 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-07616.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey},
}

@inproceedings{DBLP:conf/cikm/LiKBKBMH22,
  author     = {Jiacheng Li and
                Yannis Katsis and
                Tyler Baldwin and
                Ho{-}Cheol Kim and
                Andrew Bartko and
                Julian J. McAuley and
                Chun{-}Nan Hsu},
  editor     = {Mohammad Al Hasan and
                Li Xiong},
  title      = {{SPOT:} Knowledge-Enhanced Language Representations for Information
                Extraction},
  booktitle  = {CIKM},
  pages      = {1124--1134},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3511808.3557459},
  doi        = {10.1145/3511808.3557459},
  timestamp  = {Wed, 19 Oct 2022 17:09:02 +0200},
  biburl     = {https://dblp.org/rec/conf/cikm/LiKBKBMH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced, Information Extraction},
}

@article{DBLP:journals/corr/abs-2212-00975,
  author     = {Jinyoung Park and
                Hyeong Kyu Choi and
                Juyeon Ko and
                Hyeon{-}Jin Park and
                Ji{-}Hoon Kim and
                Jisu Jeong and
                Kyung{-}Min Kim and
                Hyunwoo J. Kim},
  title      = {Relation-aware Language-Graph Transformer for Question Answering},
  journal    = {CoRR},
  volume     = {abs/2212.00975},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.00975},
  doi        = {10.48550/arXiv.2212.00975},
  eprinttype = {arXiv},
  eprint     = {2212.00975},
  timestamp  = {Thu, 08 Dec 2022 15:26:56 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-00975.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced, Question Answering},
}

@misc{bian2023chatgpt,
  author        = {Ning Bian and
                   Xianpei Han and
                   Le Sun and
                   Hongyu Lin and
                   Yaojie Lu and
                   Ben He},
  title         = {{ChatGPT} is a Knowledgeable but Inexperienced Solver: An Investigation of Commonsense Problem in Large Language Models},
  journal       = {CoRR},
  year          = {2023},
  eprint        = {2303.16421},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2303.16421},
  keywords      = {Evaluation},
}

@misc{wu2023bloomberggpt,
  author        = {Shijie Wu and
                   Ozan Irsoy and
                   Steven Lu and
                   Vadim Dabravolski and
                   Mark Dredze and
                   Sebastian Gehrmann and
                   Prabhanjan Kambadur and
                   David Rosenberg and
                   Gideon Mann},
  title         = {{BloombergGPT}: A Large Language Model for Finance},
  year          = {2023},
  eprint        = {2303.17564},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2303.17564},
  keywords      = {Application},
}

@article{DBLP:journals/corr/abs-2204-06031,
  author     = {Badr AlKhamissi and
                Millicent Li and
                Asli Celikyilmaz and
                Mona T. Diab and
                Marjan Ghazvininejad},
  title      = {A Review on Language Models as Knowledge Bases},
  journal    = {CoRR},
  volume     = {abs/2204.06031},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.06031},
  doi        = {10.48550/arXiv.2204.06031},
  eprinttype = {arXiv},
  eprint     = {2204.06031},
  timestamp  = {Thu, 22 Sep 2022 19:27:06 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-06031.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Language Model as Knowledge Base, Survey},
}

@misc{unknown,
  author        = {Fangzhen Lin and
                   Ziyi Shou and
                   Chengcai Chen},
  title         = {Using Language Models For Knowledge Acquisition in Natural Language Reasoning Problems},
  year          = {2023},
  month         = apr,
  eprint        = {2304.01771},
  archivePrefix = {arXiv},
  url           = {https://arxiv.org/pdf/2304.01771.pdf},
  keywords      = {Reasoning},
}

@article{DBLP:journals/corr/abs-2303-07839,
  author     = {Jules White and
                Sam Hays and
                Quchen Fu and
                Jesse Spencer{-}Smith and
                Douglas C. Schmidt},
  title      = {{ChatGPT} Prompt Patterns for Improving Code Quality, Refactoring, Requirements
                Elicitation, and Software Design},
  journal    = {CoRR},
  volume     = {abs/2303.07839},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.07839},
  doi        = {10.48550/arXiv.2303.07839},
  eprinttype = {arXiv},
  eprint     = {2303.07839},
  timestamp  = {Mon, 20 Mar 2023 15:23:19 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-07839.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2202-13169,
  author     = {Frank F. Xu and
                Uri Alon and
                Graham Neubig and
                Vincent J. Hellendoorn},
  title      = {A Systematic Evaluation of Large Language Models of Code},
  journal    = {CoRR},
  volume     = {abs/2202.13169},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.13169},
  doi        = {10.48550/arXiv.2202.13169},
  eprinttype = {arXiv},
  eprint     = {2202.13169},
  timestamp  = {Wed, 02 Mar 2022 16:35:04 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-13169.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program and Code Generation, Evaluation},
}

@article{DBLP:journals/corr/abs-2303-14524,
  author     = {Yunfan Gao and
                Tao Sheng and
                Youlin Xiang and
                Yun Xiong and
                Haofen Wang and
                Jiawei Zhang},
  title      = {{Chat-REC}: Towards Interactive and Explainable {LLMs}-Augmented Recommender
                System},
  journal    = {CoRR},
  volume     = {abs/2303.14524},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.14524},
  doi        = {10.48550/arXiv.2303.14524},
  eprinttype = {arXiv},
  eprint     = {2303.14524},
  timestamp  = {Fri, 14 Apr 2023 17:38:15 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-14524.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System},
}


@misc{jang2023exploring,
  author        = {Joel Jang and
                   Seungone Kim and
                   Seonghyeon Ye and
                   Doyoung Kim and
                   Lajanugen Logeswaran and
                   Moontae Lee and
                   Kyungjae Lee and
                   Minjoon Seo},
  title         = {Exploring the Benefits of Training Expert Language Models over Instruction Tuning},
  year          = {2023},
  eprint        = {2302.03202},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2302.03202},
  keywords      = {Instruction Tuning},
}


@article{DBLP:journals/corr/abs-2304-10464,
  author     = {Yiduo Guo and
                Yaobo Liang and
                Chenfei Wu and
                Wenshan Wu and
                Dongyan Zhao and
                Nan Duan},
  title      = {Learning to Program with Natural Language},
  journal    = {CoRR},
  volume     = {abs/2304.10464},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.10464},
  doi        = {10.48550/arXiv.2304.10464},
  eprinttype = {arXiv},
  eprint     = {2304.10464},
  timestamp  = {Tue, 25 Apr 2023 17:14:23 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-10464.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program Generation},
}

@article{DBLP:journals/corr/abs-2304-08354,
  author     = {Yujia Qin and
                Shengding Hu and
                Yankai Lin and
                Weize Chen and
                Ning Ding and
                Ganqu Cui and
                Zheni Zeng and
                Yufei Huang and
                Chaojun Xiao and
                Chi Han and
                Yi Ren Fung and
                Yusheng Su and
                Huadong Wang and
                Cheng Qian and
                Runchu Tian and
                Kunlun Zhu and
                Shihao Liang and
                Xingyu Shen and
                Bokai Xu and
                Zhen Zhang and
                Yining Ye and
                Bowen Li and
                Ziwei Tang and
                Jing Yi and
                Yuzhang Zhu and
                Zhenning Dai and
                Lan Yan and
                Xin Cong and
                Yaxi Lu and
                Weilin Zhao and
                Yuxiang Huang and
                Junxi Yan and
                Xu Han and
                Xian Sun and
                Dahai Li and
                Jason Phang and
                Cheng Yang and
                Tongshuang Wu and
                Heng Ji and
                Zhiyuan Liu and
                Maosong Sun},
  title      = {Tool Learning with Foundation Models},
  journal    = {CoRR},
  volume     = {abs/2304.08354},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.08354},
  doi        = {10.48550/arXiv.2304.08354},
  eprinttype = {arXiv},
  eprint     = {2304.08354},
  timestamp  = {Fri, 21 Apr 2023 11:01:56 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-08354.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program Generation},
}

@article{DBLP:journals/corr/abs-2304-09842,
  author     = {Pan Lu and
                Baolin Peng and
                Hao Cheng and
                Michel Galley and
                Kai{-}Wei Chang and
                Ying Nian Wu and
                Song{-}Chun Zhu and
                Jianfeng Gao},
  title      = {Chameleon: Plug-and-Play Compositional Reasoning with Large Language
                Models},
  journal    = {CoRR},
  volume     = {abs/2304.09842},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.09842},
  doi        = {10.48550/arXiv.2304.09842},
  eprinttype = {arXiv},
  eprint     = {2304.09842},
  timestamp  = {Mon, 24 Apr 2023 15:03:18 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-09842.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Program Generation},
}


@article{DBLP:journals/corr/abs-2304-07987,
  author     = {Ge Zhang and
                Yemin Shi and
                Ruibo Liu and
                Ruibin Yuan and
                Yizhi Li and
                Siwei Dong and
                Yu Shu and
                Zhaoqun Li and
                Zekun Wang and
                Chenghua Lin and
                Wenhao Huang and
                Jie Fu},
  title      = {Chinese Open Instruction Generalist: {A} Preliminary Release},
  journal    = {CoRR},
  volume     = {abs/2304.07987},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.07987},
  doi        = {10.48550/arXiv.2304.07987},
  eprinttype = {arXiv},
  eprint     = {2304.07987},
  timestamp  = {Fri, 21 Apr 2023 11:01:56 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-07987.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning},
}


@article{DBLP:journals/corr/abs-2304-11116,
  author     = {Jiawei Zhang},
  title      = {{Graph-ToolFormer}: To Empower {LLMs} with Graph Reasoning Ability via
                Prompt Augmented by {ChatGPT}},
  journal    = {CoRR},
  volume     = {abs/2304.11116},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.11116},
  doi        = {10.48550/arXiv.2304.11116},
  eprinttype = {arXiv},
  eprint     = {2304.11116},
  timestamp  = {Tue, 02 May 2023 18:58:23 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-11116.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Prompt Engineering},
}

@article{DBLP:journals/corr/abs-2305-01555,
  author     = {Xin Xu and
                Yuqi Zhu and
                Xiaohan Wang and
                Ningyu Zhang},
  title      = {How to Unleash the Power of Large Language Models for Few-shot Relation
                Extraction?},
  journal    = {CoRR},
  volume     = {abs/2305.01555},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.01555},
  doi        = {10.48550/arXiv.2305.01555},
  eprinttype = {arXiv},
  eprint     = {2305.01555},
  timestamp  = {Fri, 05 May 2023 14:35:02 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-01555.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Relation Extraction},
}


@article{DBLP:journals/corr/abs-2303-18223,
  author     = {Wayne Xin Zhao and
                Kun Zhou and
                Junyi Li and
                Tianyi Tang and
                Xiaolei Wang and
                Yupeng Hou and
                Yingqian Min and
                Beichen Zhang and
                Junjie Zhang and
                Zican Dong and
                Yifan Du and
                Chen Yang and
                Yushuo Chen and
                Zhipeng Chen and
                Jinhao Jiang and
                Ruiyang Ren and
                Yifan Li and
                Xinyu Tang and
                Zikang Liu and
                Peiyu Liu and
                Jian{-}Yun Nie and
                Ji{-}Rong Wen},
  title      = {A Survey of Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2303.18223},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.18223},
  doi        = {10.48550/arXiv.2303.18223},
  eprinttype = {arXiv},
  eprint     = {2303.18223},
  timestamp  = {Mon, 17 Apr 2023 10:34:50 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-18223.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey},
}

@article{DBLP:journals/csur/JiLFYSXIBMF23,
  author     = {Ziwei Ji and
                Nayeon Lee and
                Rita Frieske and
                Tiezheng Yu and
                Dan Su and
                Yan Xu and
                Etsuko Ishii and
                Yejin Bang and
                Andrea Madotto and
                Pascale Fung},
  title      = {Survey of Hallucination in Natural Language Generation},
  journal    = {{ACM} Comput. Surv.},
  volume     = {55},
  number     = {12},
  pages      = {248:1--248:38},
  year       = {2023},
  url        = {https://doi.org/10.1145/3571730},
  doi        = {10.1145/3571730},
  timestamp  = {Fri, 02 Jun 2023 21:22:31 +0200},
  biburl     = {https://dblp.org/rec/journals/csur/JiLFYSXIBMF23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey},
}


@article{DBLP:journals/corr/abs-2302-14691,
  author     = {Seonghyeon Ye and
                Hyeonbin Hwang and
                Sohee Yang and
                Hyeongu Yun and
                Yireun Kim and
                Minjoon Seo},
  title      = {In-Context Instruction Learning},
  journal    = {CoRR},
  volume     = {abs/2302.14691},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.14691},
  doi        = {10.48550/arXiv.2302.14691},
  eprinttype = {arXiv},
  eprint     = {2302.14691},
  timestamp  = {Thu, 02 Mar 2023 10:23:33 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-14691.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2302-11521,
  author     = {Simeng Sun and
                Yang Liu and
                Dan Iter and
                Chenguang Zhu and
                Mohit Iyyer},
  title      = {How Does In-Context Learning Help Prompt Tuning?},
  journal    = {CoRR},
  volume     = {abs/2302.11521},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.11521},
  doi        = {10.48550/arXiv.2302.11521},
  eprinttype = {arXiv},
  eprint     = {2302.11521},
  timestamp  = {Fri, 24 Feb 2023 11:55:23 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-11521.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning},
}

@article{DBLP:journals/corr/abs-2304-10436,
  author     = {Hao Sun and
                Zhexin Zhang and
                Jiawen Deng and
                Jiale Cheng and
                Minlie Huang},
  title      = {Safety Assessment of {Chinese} Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2304.10436},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.10436},
  doi        = {10.48550/arXiv.2304.10436},
  eprinttype = {arXiv},
  eprint     = {2304.10436},
  timestamp  = {Tue, 25 Apr 2023 17:14:23 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-10436.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Safety},
}

% Wang et al., 2023 -- arXiv preprint 2307.12966 (DBLP export); tagged Survey.
@article{DBLP:journals/corr/abs-2307-12966,
  author       = {Yufei Wang and
                  Wanjun Zhong and
                  Liangyou Li and
                  Fei Mi and
                  Xingshan Zeng and
                  Wenyong Huang and
                  Lifeng Shang and
                  Xin Jiang and
                  Qun Liu},
  title        = {Aligning Large Language Models with Human: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2307.12966},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.12966},
  doi          = {10.48550/arXiv.2307.12966},
  eprinttype   = {arXiv},
  eprint       = {2307.12966},
  keywords     = {Survey},
  timestamp    = {Tue, 01 Aug 2023 14:49:51 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-12966.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Zheng et al., 2023 -- arXiv preprint 2307.04964 (DBLP export); tagged RLHF.
@article{DBLP:journals/corr/abs-2307-04964,
  author       = {Rui Zheng and
                  Shihan Dou and
                  Songyang Gao and
                  Yuan Hua and
                  Wei Shen and
                  Binghai Wang and
                  Yan Liu and
                  Senjie Jin and
                  Qin Liu and
                  Yuhao Zhou and
                  Limao Xiong and
                  Lu Chen and
                  Zhiheng Xi and
                  Nuo Xu and
                  Wenbin Lai and
                  Minghao Zhu and
                  Cheng Chang and
                  Zhangyue Yin and
                  Rongxiang Weng and
                  Wensen Cheng and
                  Haoran Huang and
                  Tianxiang Sun and
                  Hang Yan and
                  Tao Gui and
                  Qi Zhang and
                  Xipeng Qiu and
                  Xuanjing Huang},
  title        = {Secrets of {RLHF} in Large Language Models Part {I:} {PPO}},
  journal      = {CoRR},
  volume       = {abs/2307.04964},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.04964},
  doi          = {10.48550/arXiv.2307.04964},
  eprinttype   = {arXiv},
  eprint       = {2307.04964},
  keywords     = {RLHF},
  timestamp    = {Mon, 24 Jul 2023 16:32:58 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-04964.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Casper et al., 2023 -- arXiv preprint 2307.15217 (DBLP export); tagged RLHF.
@article{DBLP:journals/corr/abs-2307-15217,
  author       = {Stephen Casper and
                  Xander Davies and
                  Claudia Shi and
                  Thomas Krendl Gilbert and
                  J{\'{e}}r{\'{e}}my Scheurer and
                  Javier Rando and
                  Rachel Freedman and
                  Tomasz Korbak and
                  David Lindner and
                  Pedro Freire and
                  Tony Wang and
                  Samuel Marks and
                  Charbel{-}Rapha{\"{e}}l S{\'{e}}gerie and
                  Micah Carroll and
                  Andi Peng and
                  Phillip J. K. Christoffersen and
                  Mehul Damani and
                  Stewart Slocum and
                  Usman Anwar and
                  Anand Siththaranjan and
                  Max Nadeau and
                  Eric J. Michaud and
                  Jacob Pfau and
                  Dmitrii Krasheninnikov and
                  Xin Chen and
                  Lauro Langosco and
                  Peter Hase and
                  Erdem Biyik and
                  Anca D. Dragan and
                  David Krueger and
                  Dorsa Sadigh and
                  Dylan Hadfield{-}Menell},
  title        = {Open Problems and Fundamental Limitations of Reinforcement Learning
                  from Human Feedback},
  journal      = {CoRR},
  volume       = {abs/2307.15217},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.15217},
  doi          = {10.48550/arXiv.2307.15217},
  eprinttype   = {arXiv},
  eprint       = {2307.15217},
  keywords     = {RLHF},
  timestamp    = {Wed, 02 Aug 2023 15:37:53 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-15217.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Wang et al., 2023 -- arXiv preprint 2308.11432 (DBLP export); tagged Survey.
@article{DBLP:journals/corr/abs-2308-11432,
  author       = {Lei Wang and
                  Chen Ma and
                  Xueyang Feng and
                  Zeyu Zhang and
                  Hao Yang and
                  Jingsen Zhang and
                  Zhiyuan Chen and
                  Jiakai Tang and
                  Xu Chen and
                  Yankai Lin and
                  Wayne Xin Zhao and
                  Zhewei Wei and
                  Ji{-}Rong Wen},
  title        = {A Survey on Large Language Model based Autonomous Agents},
  journal      = {CoRR},
  volume       = {abs/2308.11432},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.11432},
  doi          = {10.48550/arXiv.2308.11432},
  eprinttype   = {arXiv},
  eprint       = {2308.11432},
  keywords     = {Survey},
  timestamp    = {Wed, 30 Aug 2023 17:27:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-11432.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Peng et al., 2023 -- arXiv preprint 2304.03277 (DBLP export); tagged Instruction Tuning.
@article{DBLP:journals/corr/abs-2304-03277,
  author       = {Baolin Peng and
                  Chunyuan Li and
                  Pengcheng He and
                  Michel Galley and
                  Jianfeng Gao},
  title        = {Instruction Tuning with {GPT-4}},
  journal      = {CoRR},
  volume       = {abs/2304.03277},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.03277},
  doi          = {10.48550/arXiv.2304.03277},
  eprinttype   = {arXiv},
  eprint       = {2304.03277},
  keywords     = {Instruction Tuning},
  timestamp    = {Tue, 18 Apr 2023 17:25:12 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-03277.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Ray, 2023 -- journal article published by Elsevier; tagged Survey.
% Volume, pages and DOI are filled in so the reference is complete and resolvable
% (NOTE(review): confirm these three values against the publisher record).
% ChatGPT is brace-protected so sentence-casing styles keep its capitalization.
@article{ray2023chatgpt,
  title={{ChatGPT}: A comprehensive review on background, applications, key challenges, bias, ethics, limitations and future scope},
  author={Ray, Partha Pratim},
  journal={Internet of Things and Cyber-Physical Systems},
  volume={3},
  pages={121--154},
  year={2023},
  publisher={Elsevier},
  doi={10.1016/j.iotcps.2023.04.003},
  url = {https://www.sciencedirect.com/science/article/pii/S266734522300024X},
  keywords = {Survey}
}

% Cheng et al., 2023 -- arXiv preprint 2305.15038 (DBLP export); tagged Application.
@article{DBLP:journals/corr/abs-2305-15038,
  author       = {Liying Cheng and
                  Xingxuan Li and
                  Lidong Bing},
  title        = {Is {GPT-4} a Good Data Analyst?},
  journal      = {CoRR},
  volume       = {abs/2305.15038},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.15038},
  doi          = {10.48550/arXiv.2305.15038},
  eprinttype   = {arXiv},
  eprint       = {2305.15038},
  keywords     = {Application},
  timestamp    = {Tue, 06 Jun 2023 18:10:43 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-15038.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Hou et al., 2023 -- arXiv preprint 2308.10620 (DBLP export); tagged Survey.
@article{DBLP:journals/corr/abs-2308-10620,
  author       = {Xinyi Hou and
                  Yanjie Zhao and
                  Yue Liu and
                  Zhou Yang and
                  Kailong Wang and
                  Li Li and
                  Xiapu Luo and
                  David Lo and
                  John C. Grundy and
                  Haoyu Wang},
  title        = {Large Language Models for Software Engineering: {A} Systematic Literature
                  Review},
  journal      = {CoRR},
  volume       = {abs/2308.10620},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.10620},
  doi          = {10.48550/arXiv.2308.10620},
  eprinttype   = {arXiv},
  eprint       = {2308.10620},
  keywords     = {Survey},
  timestamp    = {Thu, 31 Aug 2023 10:19:30 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-10620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Besta et al., 2023 -- arXiv preprint 2308.09687 (DBLP export); tagged Chain of Thought.
@article{DBLP:journals/corr/abs-2308-09687,
  author       = {Maciej Besta and
                  Nils Blach and
                  Ales Kubicek and
                  Robert Gerstenberger and
                  Lukas Gianinazzi and
                  Joanna Gajda and
                  Tomasz Lehmann and
                  Michal Podstawski and
                  Hubert Niewiadomski and
                  Piotr Nyczyk and
                  Torsten Hoefler},
  title        = {Graph of Thoughts: Solving Elaborate Problems with Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2308.09687},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.09687},
  doi          = {10.48550/arXiv.2308.09687},
  eprinttype   = {arXiv},
  eprint       = {2308.09687},
  keywords     = {Chain of Thought},
  timestamp    = {Fri, 25 Aug 2023 11:24:49 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-09687.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Zhuang et al., 2023 -- arXiv preprint 2308.07902 (DBLP export); tagged Evaluation.
@article{DBLP:journals/corr/abs-2308-07902,
  author       = {Ziyu Zhuang and
                  Qiguang Chen and
                  Longxuan Ma and
                  Mingda Li and
                  Yi Han and
                  Yushan Qian and
                  Haopeng Bai and
                  Zixian Feng and
                  Weinan Zhang and
                  Ting Liu},
  title        = {Through the Lens of Core Competency: Survey on Evaluation of Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2308.07902},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.07902},
  doi          = {10.48550/arXiv.2308.07902},
  eprinttype   = {arXiv},
  eprint       = {2308.07902},
  keywords     = {Evaluation},
  timestamp    = {Wed, 23 Aug 2023 14:43:32 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-07902.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Ma et al., 2023 -- arXiv preprint 2303.13217 (DBLP export); tagged In-Context Learning.
@article{DBLP:journals/corr/abs-2303-13217,
  author       = {Huan Ma and
                  Changqing Zhang and
                  Yatao Bian and
                  Lemao Liu and
                  Zhirui Zhang and
                  Peilin Zhao and
                  Shu Zhang and
                  Huazhu Fu and
                  Qinghua Hu and
                  Bingzhe Wu},
  title        = {Fairness-guided Few-shot Prompting for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2303.13217},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.13217},
  doi          = {10.48550/arXiv.2303.13217},
  eprinttype   = {arXiv},
  eprint       = {2303.13217},
  keywords     = {In-Context Learning},
  timestamp    = {Thu, 13 Apr 2023 17:40:16 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-13217.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Fu et al., 2023 -- arXiv preprint 2305.17306 (DBLP export); tagged Evaluation.
@article{DBLP:journals/corr/abs-2305-17306,
  author       = {Yao Fu and
                  Litu Ou and
                  Mingyu Chen and
                  Yuhao Wan and
                  Hao Peng and
                  Tushar Khot},
  title        = {Chain-of-Thought Hub: {A} Continuous Effort to Measure Large Language
                  Models' Reasoning Performance},
  journal      = {CoRR},
  volume       = {abs/2305.17306},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.17306},
  doi          = {10.48550/arXiv.2305.17306},
  eprinttype   = {arXiv},
  eprint       = {2305.17306},
  keywords     = {Evaluation},
  timestamp    = {Tue, 13 Jun 2023 11:58:39 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-17306.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Himakunthala et al., 2023 -- arXiv preprint 2305.13903 (DBLP export); tagged Multimodal.
@article{DBLP:journals/corr/abs-2305-13903,
  author       = {Vaishnavi Himakunthala and
                  Andy Ouyang and
                  Daniel Rose and
                  Ryan He and
                  Alex Mei and
                  Yujie Lu and
                  Chinmay Sonar and
                  Michael Saxon and
                  William Yang Wang},
  title        = {Let's Think Frame by Frame: Evaluating Video Chain of Thought with
                  Video Infilling and Prediction},
  journal      = {CoRR},
  volume       = {abs/2305.13903},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.13903},
  doi          = {10.48550/arXiv.2305.13903},
  eprinttype   = {arXiv},
  eprint       = {2305.13903},
  keywords     = {Multimodal},
  timestamp    = {Mon, 05 Jun 2023 15:42:15 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-13903.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Kandpal et al., 2023 -- ICML paper, PMLR volume 202 (DBLP export); tagged Language Model as Knowledge Base.
@inproceedings{DBLP:conf/icml/KandpalDRWR23,
  author       = {Nikhil Kandpal and
                  Haikang Deng and
                  Adam Roberts and
                  Eric Wallace and
                  Colin Raffel},
  editor       = {Andreas Krause and
                  Emma Brunskill and
                  Kyunghyun Cho and
                  Barbara Engelhardt and
                  Sivan Sabato and
                  Jonathan Scarlett},
  title        = {Large Language Models Struggle to Learn Long-Tail Knowledge},
  booktitle    = {ICML},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {15696--15707},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/kandpal23a.html},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KandpalDRWR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Cao et al., 2021 -- ACL paper (DBLP export); tagged Language Model as Knowledge Base.
@inproceedings{DBLP:conf/acl/CaoLHSYLXX20,
  author       = {Boxi Cao and
                  Hongyu Lin and
                  Xianpei Han and
                  Le Sun and
                  Lingyong Yan and
                  Meng Liao and
                  Tong Xue and
                  Jin Xu},
  editor       = {Chengqing Zong and
                  Fei Xia and
                  Wenjie Li and
                  Roberto Navigli},
  title        = {Knowledgeable or Educated Guess? Revisiting Language Models as Knowledge
                  Bases},
  booktitle    = {ACL},
  pages        = {1860--1874},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.146},
  doi          = {10.18653/v1/2021.acl-long.146},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Thu, 31 Aug 2023 08:17:29 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/CaoLHSYLXX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Blevins et al., 2023 -- ACL paper (DBLP export); tagged Information Extraction.
@inproceedings{DBLP:conf/acl/BlevinsGZ23,
  author       = {Terra Blevins and
                  Hila Gonen and
                  Luke Zettlemoyer},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Prompting Language Models for Linguistic Structure},
  booktitle    = {ACL},
  pages        = {6649--6663},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.367},
  doi          = {10.18653/v1/2023.acl-long.367},
  keywords     = {Information Extraction},
  timestamp    = {Thu, 10 Aug 2023 12:35:50 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/BlevinsGZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Dhingra et al., 2022 -- TACL journal article, volume 10 (DBLP export); tagged Language Model as Knowledge Base.
@article{DBLP:journals/tacl/DhingraCEGEC22,
  author       = {Bhuwan Dhingra and
                  Jeremy R. Cole and
                  Julian Martin Eisenschlos and
                  Daniel Gillick and
                  Jacob Eisenstein and
                  William W. Cohen},
  title        = {Time-Aware Language Models as Temporal Knowledge Bases},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {10},
  pages        = {257--273},
  year         = {2022},
  url          = {https://doi.org/10.1162/tacl\_a\_00459},
  doi          = {10.1162/tacl\_a\_00459},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Wed, 29 Jun 2022 16:03:22 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/DhingraCEGEC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Gupta et al., 2023 -- arXiv preprint 2308.04014 (DBLP export); tagged Continual Learning.
@article{DBLP:journals/corr/abs-2308-04014,
  author       = {Kshitij Gupta and
                  Benjamin Th{\'{e}}rien and
                  Adam Ibrahim and
                  Mats L. Richter and
                  Quentin Anthony and
                  Eugene Belilovsky and
                  Irina Rish and
                  Timoth{\'{e}}e Lesort},
  title        = {Continual Pre-Training of Large Language Models: How to (re)warm your
                  model?},
  journal      = {CoRR},
  volume       = {abs/2308.04014},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.04014},
  doi          = {10.48550/arXiv.2308.04014},
  eprinttype   = {arXiv},
  eprint       = {2308.04014},
  keywords     = {Continual Learning},
  timestamp    = {Tue, 22 Aug 2023 13:58:15 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-04014.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}


% Ke et al., 2023 -- ICLR paper hosted on OpenReview (DBLP export); tagged Continual Learning.
@inproceedings{DBLP:conf/iclr/KeSLKK023,
  author       = {Zixuan Ke and
                  Yijia Shao and
                  Haowei Lin and
                  Tatsuya Konishi and
                  Gyuhak Kim and
                  Bing Liu},
  title        = {Continual Pre-training of Language Models},
  booktitle    = {ICLR},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=m\_GDIItaI3o},
  keywords     = {Continual Learning},
  timestamp    = {Fri, 30 Jun 2023 14:55:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/KeSLKK023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Alivanistos et al., 2022 -- arXiv preprint 2208.11057 (DBLP export); tagged Language Model as Knowledge Base.
% The second author is written in Last, First form so the two-word surname is kept
% together; in First Last form BibTeX would treat only the final word as the surname.
% NOTE(review): assumes the surname is the compound Baez Santamaria -- confirm.
@article{DBLP:journals/corr/abs-2208-11057,
  author       = {Dimitrios Alivanistos and
                  Baez Santamar{\'{\i}}a, Selene and
                  Michael Cochez and
                  Jan{-}Christoph Kalo and
                  Emile van Krieken and
                  Thiviyan Thanapalasingam},
  title        = {Prompting as Probing: Using Language Models for Knowledge Base Construction},
  journal      = {CoRR},
  volume       = {abs/2208.11057},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.11057},
  doi          = {10.48550/arXiv.2208.11057},
  eprinttype   = {arXiv},
  eprint       = {2208.11057},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Mon, 29 Aug 2022 15:51:41 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-11057.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Cohen et al., 2023 -- EACL Findings paper (DBLP export); tagged Language Model as Knowledge Base.
% The anthology URL identifies this as a Findings paper (findings-eacl), so the venue
% label says so instead of attributing it to the main conference.
@inproceedings{DBLP:conf/eacl/CohenGBG23,
  author       = {Roi Cohen and
                  Mor Geva and
                  Jonathan Berant and
                  Amir Globerson},
  editor       = {Andreas Vlachos and
                  Isabelle Augenstein},
  title        = {Crawling The Internal Knowledge-Base of Language Models},
  booktitle    = {EACL (Findings)},
  pages        = {1811--1824},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.findings-eacl.139},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Mon, 08 May 2023 14:38:37 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/CohenGBG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}


% Sung et al., 2021 -- EMNLP paper (DBLP export); tagged Language Model as Knowledge Base.
@inproceedings{DBLP:conf/emnlp/SungLYJKK21,
  author       = {Mujeen Sung and
                  Jinhyuk Lee and
                  Sean S. Yi and
                  Minji Jeon and
                  Sungdong Kim and
                  Jaewoo Kang},
  editor       = {Marie{-}Francine Moens and
                  Xuanjing Huang and
                  Lucia Specia and
                  Scott Wen{-}tau Yih},
  title        = {Can Language Models be Biomedical Knowledge Bases?},
  booktitle    = {EMNLP},
  pages        = {4723--4734},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.388},
  doi          = {10.18653/v1/2021.emnlp-main.388},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Thu, 20 Jan 2022 10:02:30 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/SungLYJKK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Pezeshkpour, 2023 -- arXiv preprint 2306.06264 (DBLP export); tagged Language Model as Knowledge Base.
@article{DBLP:journals/corr/abs-2306-06264,
  author       = {Pouya Pezeshkpour},
  title        = {Measuring and Modifying Factual Knowledge in Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2306.06264},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.06264},
  doi          = {10.48550/arXiv.2306.06264},
  eprinttype   = {arXiv},
  eprint       = {2306.06264},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Fri, 16 Jun 2023 12:41:12 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-06264.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Pan et al., 2023 -- arXiv preprint 2306.08302 (DBLP export); tagged Survey.
@article{DBLP:journals/corr/abs-2306-08302,
  author       = {Shirui Pan and
                  Linhao Luo and
                  Yufei Wang and
                  Chen Chen and
                  Jiapu Wang and
                  Xindong Wu},
  title        = {Unifying Large Language Models and Knowledge Graphs: {A} Roadmap},
  journal      = {CoRR},
  volume       = {abs/2306.08302},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.08302},
  doi          = {10.48550/arXiv.2306.08302},
  eprinttype   = {arXiv},
  eprint       = {2306.08302},
  keywords     = {Survey},
  timestamp    = {Sun, 18 Jun 2023 16:10:59 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-08302.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Zhang et al., 2023 -- Mach. Intell. Res. 20(2) journal article (DBLP export); tagged Multimodal.
@article{DBLP:journals/ijautcomp/ZhangRHJ23,
  author       = {Liang Zhang and
                  Ludan Ruan and
                  Anwen Hu and
                  Qin Jin},
  title        = {Multimodal Pretraining from Monolingual to Multilingual},
  journal      = {Mach. Intell. Res.},
  volume       = {20},
  number       = {2},
  pages        = {220--232},
  year         = {2023},
  url          = {https://doi.org/10.1007/s11633-022-1414-4},
  doi          = {10.1007/s11633-022-1414-4},
  keywords     = {Multimodal},
  timestamp    = {Sat, 29 Apr 2023 19:26:35 +0200},
  biburl       = {https://dblp.org/rec/journals/ijautcomp/ZhangRHJ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Hu et al., 2023 -- Mach. Intell. Res. 20(2) journal article (DBLP export); tagged Multimodal.
@article{DBLP:journals/ijautcomp/HuHZ23,
  author       = {Guyue Hu and
                  Bin He and
                  Hanwang Zhang},
  title        = {Compositional Prompting Video-language Models to Understand Procedure
                  in Instructional Videos},
  journal      = {Mach. Intell. Res.},
  volume       = {20},
  number       = {2},
  pages        = {249--262},
  year         = {2023},
  url          = {https://doi.org/10.1007/s11633-022-1409-1},
  doi          = {10.1007/s11633-022-1409-1},
  keywords     = {Multimodal},
  timestamp    = {Sat, 29 Apr 2023 19:26:35 +0200},
  biburl       = {https://dblp.org/rec/journals/ijautcomp/HuHZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Gu et al., 2023 -- Mach. Intell. Res. 20(2) journal article (DBLP export); tagged Dialogue System.
% The proper adjective Chinese is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/ijautcomp/GuWSSKZZYLZH23,
  author       = {Yuxian Gu and
                  Jiaxin Wen and
                  Hao Sun and
                  Yi Song and
                  Pei Ke and
                  Chujie Zheng and
                  Zheng Zhang and
                  Jianzhu Yao and
                  Lei Liu and
                  Xiaoyan Zhu and
                  Minlie Huang},
  title        = {{EVA2.0:} Investigating Open-domain {Chinese} Dialogue Systems with
                  Large-scale Pre-training},
  journal      = {Mach. Intell. Res.},
  volume       = {20},
  number       = {2},
  pages        = {207--219},
  year         = {2023},
  url          = {https://doi.org/10.1007/s11633-022-1387-3},
  doi          = {10.1007/s11633-022-1387-3},
  keywords     = {Dialogue System},
  timestamp    = {Mon, 01 May 2023 13:02:33 +0200},
  biburl       = {https://dblp.org/rec/journals/ijautcomp/GuWSSKZZYLZH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Li et al., 2023 -- ACL Findings paper (DBLP export); tagged Retrieval-Augmented Language Model.
% The DOI identifies this as a Findings paper (findings-acl), so the venue label
% says so instead of attributing it to the main conference.
@inproceedings{DBLP:conf/acl/LiTZWNW23,
  author       = {Junyi Li and
                  Tianyi Tang and
                  Wayne Xin Zhao and
                  Jingyuan Wang and
                  Jian{-}Yun Nie and
                  Ji{-}Rong Wen},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {The Web Can Be Your Oyster for Improving Language Models},
  booktitle    = {ACL (Findings)},
  pages        = {728--746},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.46},
  doi          = {10.18653/v1/2023.findings-acl.46},
  keywords     = {Retrieval-Augmented Language Model},
  timestamp    = {Thu, 10 Aug 2023 12:35:43 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiTZWNW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Gao et al., 2023 -- ACL paper (DBLP export); tagged Continual Learning.
@inproceedings{DBLP:conf/acl/GaoZLZW23,
  author       = {Ze{-}Feng Gao and
                  Kun Zhou and
                  Peiyu Liu and
                  Wayne Xin Zhao and
                  Ji{-}Rong Wen},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Small Pre-trained Language Models Can be Fine-tuned as Large Models
                  via Over-Parameterization},
  booktitle    = {ACL},
  pages        = {3819--3834},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.212},
  doi          = {10.18653/v1/2023.acl-long.212},
  keywords     = {Continual Learning},
  timestamp    = {Thu, 10 Aug 2023 12:35:46 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/GaoZLZW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Zhang et al., 2023 -- arXiv preprint 2305.07001 (DBLP export); tagged Recommender System.
@article{DBLP:journals/corr/abs-2305-07001,
  author       = {Junjie Zhang and
                  Ruobing Xie and
                  Yupeng Hou and
                  Wayne Xin Zhao and
                  Leyu Lin and
                  Ji{-}Rong Wen},
  title        = {Recommendation as Instruction Following: {A} Large Language Model
                  Empowered Recommendation Approach},
  journal      = {CoRR},
  volume       = {abs/2305.07001},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.07001},
  doi          = {10.48550/arXiv.2305.07001},
  eprinttype   = {arXiv},
  eprint       = {2305.07001},
  keywords     = {Recommender System},
  timestamp    = {Wed, 17 May 2023 15:47:36 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-07001.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}


% Zhu et al., 2023 -- arXiv preprint 2308.07107 (DBLP export); tagged Survey.
@article{DBLP:journals/corr/abs-2308-07107,
  author       = {Yutao Zhu and
                  Huaying Yuan and
                  Shuting Wang and
                  Jiongnan Liu and
                  Wenhan Liu and
                  Chenlong Deng and
                  Zhicheng Dou and
                  Ji{-}Rong Wen},
  title        = {Large Language Models for Information Retrieval: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2308.07107},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.07107},
  doi          = {10.48550/arXiv.2308.07107},
  eprinttype   = {arXiv},
  eprint       = {2308.07107},
  keywords     = {Survey},
  timestamp    = {Wed, 23 Aug 2023 14:43:32 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-07107.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}


% Luo et al., 2023 -- arXiv preprint 2305.14128 (DBLP export); tagged In-Context Learning.
% The method name Dr.ICL is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase its capitals.
@article{DBLP:journals/corr/abs-2305-14128,
  author       = {Man Luo and
                  Xin Xu and
                  Zhuyun Dai and
                  Panupong Pasupat and
                  Seyed Mehran Kazemi and
                  Chitta Baral and
                  Vaiva Imbrasaite and
                  Vincent Y. Zhao},
  title        = {{Dr.ICL:} Demonstration-Retrieved In-context Learning},
  journal      = {CoRR},
  volume       = {abs/2305.14128},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14128},
  doi          = {10.48550/arXiv.2305.14128},
  eprinttype   = {arXiv},
  eprint       = {2305.14128},
  keywords     = {In-Context Learning},
  timestamp    = {Mon, 05 Jun 2023 15:42:15 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14128.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Li et al., 2023 -- ACL paper (DBLP export); tagged In-Context Learning.
@inproceedings{DBLP:conf/acl/LiLYLZNXWQ23,
  author       = {Xiaonan Li and
                  Kai Lv and
                  Hang Yan and
                  Tianyang Lin and
                  Wei Zhu and
                  Yuan Ni and
                  Guotong Xie and
                  Xiaoling Wang and
                  Xipeng Qiu},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Unified Demonstration Retriever for In-Context Learning},
  booktitle    = {ACL},
  pages        = {4644--4668},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.256},
  doi          = {10.18653/v1/2023.acl-long.256},
  keywords     = {In-Context Learning},
  timestamp    = {Thu, 10 Aug 2023 12:35:46 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiLYLZNXWQ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Yang et al., 2023 -- arXiv preprint 2306.11489 (DBLP export); tagged Language Model as Knowledge Base.
% The product name ChatGPT is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase its inner capitals.
@article{DBLP:journals/corr/abs-2306-11489,
  author       = {Linyao Yang and
                  Hongyang Chen and
                  Zhao Li and
                  Xiao Ding and
                  Xindong Wu},
  title        = {{ChatGPT} is not Enough: Enhancing Large Language Models with Knowledge
                  Graphs for Fact-aware Language Modeling},
  journal      = {CoRR},
  volume       = {abs/2306.11489},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.11489},
  doi          = {10.48550/arXiv.2306.11489},
  eprinttype   = {arXiv},
  eprint       = {2306.11489},
  keywords     = {Language Model as Knowledge Base},
  timestamp    = {Fri, 23 Jun 2023 15:19:11 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-11489.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

% Giglou et al., 2023 -- arXiv preprint 2307.16648 (DBLP export); tagged Knowledge Generation.
% The name LLMs4OL is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase its capitals.
@article{DBLP:journals/corr/abs-2307-16648,
  author       = {Hamed Babaei Giglou and
                  Jennifer D'Souza and
                  S{\"{o}}ren Auer},
  title        = {{LLMs4OL:} Large Language Models for Ontology Learning},
  journal      = {CoRR},
  volume       = {abs/2307.16648},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.16648},
  doi          = {10.48550/arXiv.2307.16648},
  eprinttype   = {arXiv},
  eprint       = {2307.16648},
  keywords     = {Knowledge Generation},
  timestamp    = {Wed, 02 Aug 2023 15:37:53 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-16648.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/abs-2302-01150,
  author     = {Simon Gottschalk and
                Elena Demidova},
  title      = {{Tab2KG}: Semantic Table Interpretation with Lightweight Semantic Profiles},
  journal    = {CoRR},
  volume     = {abs/2302.01150},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.01150},
  doi        = {10.48550/arXiv.2302.01150},
  eprinttype = {arXiv},
  eprint     = {2302.01150},
  timestamp  = {Thu, 09 Feb 2023 16:11:17 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-01150.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Generation}
}

@inproceedings{DBLP:conf/acl/LoganLPGS19,
  author     = {Robert L. {Logan IV} and
                Nelson F. Liu and
                Matthew E. Peters and
                Matt Gardner and
                Sameer Singh},
  editor     = {Anna Korhonen and
                David R. Traum and
                Llu{\'{\i}}s M{\`{a}}rquez},
  title      = {{Barack's} Wife {Hillary}: Using Knowledge Graphs for Fact-Aware Language
                Modeling},
  booktitle  = {ACL},
  pages      = {5962--5971},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  url        = {https://doi.org/10.18653/v1/p19-1598},
  doi        = {10.18653/v1/p19-1598},
  timestamp  = {Fri, 06 Aug 2021 00:41:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LoganLPGS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced}
}

@inproceedings{DBLP:conf/emnlp/AggarwalSP22,
  author     = {Arshiya Aggarwal and
                Jiao Sun and
                Nanyun Peng},
  editor     = {Yoav Goldberg and
                Zornitsa Kozareva and
                Yue Zhang},
  title      = {Towards Robust {NLG} Bias Evaluation with Syntactically-diverse Prompts},
  booktitle  = {EMNLP},
  pages      = {6022--6032},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-emnlp.445},
  doi        = {10.18653/v1/2022.findings-emnlp.445},
  timestamp  = {Thu, 10 Aug 2023 12:35:36 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/AggarwalSP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Evaluation}
}


@inproceedings{DBLP:conf/acl/WangXLHLLL23,
  author     = {Lei Wang and
                Wanyu Xu and
                Yihuai Lan and
                Zhiqiang Hu and
                Yunshi Lan and
                Roy Ka{-}Wei Lee and
                Ee{-}Peng Lim},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Plan-and-Solve Prompting: Improving Zero-Shot Chain-of-Thought Reasoning
                by Large Language Models},
  booktitle  = {ACL},
  pages      = {2609--2634},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.147},
  doi        = {10.18653/v1/2023.acl-long.147},
  timestamp  = {Fri, 25 Aug 2023 08:01:11 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/WangXLHLLL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


@article{DBLP:journals/corr/abs-2305-08291,
  author     = {Jieyi Long},
  title      = {Large Language Model Guided Tree-of-Thought},
  journal    = {CoRR},
  volume     = {abs/2305.08291},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.08291},
  doi        = {10.48550/arXiv.2305.08291},
  eprinttype = {arXiv},
  eprint     = {2305.08291},
  timestamp  = {Wed, 17 May 2023 15:47:36 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-08291.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@inproceedings{DBLP:conf/acl/YuanYLTLXX23,
  author     = {Siyu Yuan and
                Deqing Yang and
                Jinxi Liu and
                Shuyu Tian and
                Jiaqing Liang and
                Yanghua Xiao and
                Rui Xie},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Causality-aware Concept Extraction based on Knowledge-guided Prompting},
  booktitle  = {ACL},
  pages      = {9255--9272},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.514},
  doi        = {10.18653/v1/2023.acl-long.514},
  timestamp  = {Thu, 10 Aug 2023 12:35:47 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/YuanYLTLXX23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@inproceedings{DBLP:conf/acl/WadhwaAW23,
  author     = {Somin Wadhwa and
                Silvio Amir and
                Byron C. Wallace},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Revisiting Relation Extraction in the era of Large Language Models},
  booktitle  = {ACL},
  pages      = {15566--15589},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.868},
  doi        = {10.18653/v1/2023.acl-long.868},
  timestamp  = {Thu, 10 Aug 2023 12:36:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/WadhwaAW23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2305-14450,
  author     = {Ridong Han and
                Tao Peng and
                Chaohao Yang and
                Benyou Wang and
                Lu Liu and
                Xiang Wan},
  title      = {Is Information Extraction Solved by {ChatGPT}? An Analysis of Performance,
                Evaluation Criteria, Robustness and Errors},
  journal    = {CoRR},
  volume     = {abs/2305.14450},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.14450},
  doi        = {10.48550/arXiv.2305.14450},
  eprinttype = {arXiv},
  eprint     = {2305.14450},
  timestamp  = {Fri, 04 Aug 2023 08:25:39 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-14450.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2309-00267,
  author     = {Harrison Lee and
                Samrat Phatale and
                Hassan Mansoor and
                Kellie Lu and
                Thomas Mesnard and
                Colton Bishop and
                Victor Carbune and
                Abhinav Rastogi},
  title      = {{RLAIF:} Scaling Reinforcement Learning from Human Feedback with {AI}
                Feedback},
  journal    = {CoRR},
  volume     = {abs/2309.00267},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.00267},
  doi        = {10.48550/arXiv.2309.00267},
  eprinttype = {arXiv},
  eprint     = {2309.00267},
  timestamp  = {Mon, 11 Sep 2023 16:01:35 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-00267.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {RLHF}
}

@article{lin2023speciality,
  author     = {Lin, Yong and Tan, Lu and Lin, Hangyu and Zheng, Zeming and Pi, Renjie and Zhang, Jipeng and Diao, Shizhe and Wang, Haoxiang and Zhao, Han and Yao, Yuan and others},
  title      = {Speciality vs Generality: An Empirical Study on Catastrophic Forgetting in Fine-tuning Foundation Models},
  journal    = {CoRR},
  volume     = {abs/2309.06256},
  year       = {2023},
  url        = {https://arxiv.org/pdf/2309.06256.pdf},
  eprinttype = {arXiv},
  eprint     = {2309.06256},
  keywords   = {Continual Learning}
}

@inproceedings{DBLP:conf/acl/Chen0LLJDWCH023,
  author     = {Jiawei Chen and
                Yaojie Lu and
                Hongyu Lin and
                Jie Lou and
                Wei Jia and
                Dai Dai and
                Hua Wu and
                Boxi Cao and
                Xianpei Han and
                Le Sun},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Learning In-context Learning for Named Entity Recognition},
  booktitle  = {ACL},
  pages      = {13661--13675},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.764},
  doi        = {10.18653/v1/2023.acl-long.764},
  timestamp  = {Thu, 10 Aug 2023 12:35:44 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Chen0LLJDWCH023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@article{DBLP:journals/corr/abs-2309-03118,
  author     = {Chao Feng and
                Xinyu Zhang and
                Zichu Fei},
  title      = {Knowledge Solver: Teaching {LLMs} to Search for Domain Knowledge from
                Knowledge Graphs},
  journal    = {CoRR},
  volume     = {abs/2309.03118},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.03118},
  doi        = {10.48550/arXiv.2309.03118},
  eprinttype = {arXiv},
  eprint     = {2309.03118},
  timestamp  = {Tue, 12 Sep 2023 12:50:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-03118.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Retrieval-Augmented Language Models}
}

@inproceedings{DBLP:conf/esws/Khorashadizadeh23,
  author     = {Hanieh Khorashadizadeh and
                Nandana Mihindukulasooriya and
                Sanju Tiwari and
                Jinghua Groppe and
                Sven Groppe},
  editor     = {Sanju Tiwari and
                Nandana Mihindukulasooriya and
                Francesco Osborne and
                Dimitris Kontokostas and
                Jennifer D'Souza and
                Mayank Kejriwal and
                Edgard Marx},
  title      = {Exploring In-Context Learning Capabilities of Foundation Models for
                Generating Knowledge Graphs from Text},
  booktitle  = {ESWC},
  series     = {{CEUR} Workshop Proceedings},
  volume     = {3447},
  pages      = {132--153},
  publisher  = {CEUR-WS.org},
  year       = {2023},
  url        = {https://ceur-ws.org/Vol-3447/Text2KG\_Paper\_9.pdf},
  timestamp  = {Thu, 03 Aug 2023 16:22:08 +0200},
  biburl     = {https://dblp.org/rec/conf/esws/Khorashadizadeh23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

  @inproceedings{DBLP:conf/acl/WhitehouseVA0P23,
  author     = {Chenxi Whitehouse and
                Clara Vania and
                Alham Fikri Aji and
                Christos Christodoulopoulos and
                Andrea Pierleoni},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {{WebIE}: Faithful and Robust Information Extraction on the Web},
  booktitle  = {ACL},
  pages      = {7734--7755},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.428},
  doi        = {10.18653/v1/2023.acl-long.428},
  timestamp  = {Thu, 10 Aug 2023 12:36:01 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/WhitehouseVA0P23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2307-03109,
  author     = {Yupeng Chang and
                Xu Wang and
                Jindong Wang and
                Yuan Wu and
                Kaijie Zhu and
                Hao Chen and
                Linyi Yang and
                Xiaoyuan Yi and
                Cunxiang Wang and
                Yidong Wang and
                Wei Ye and
                Yue Zhang and
                Yi Chang and
                Philip S. Yu and
                Qiang Yang and
                Xing Xie},
  title      = {A Survey on Evaluation of Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2307.03109},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.03109},
  doi        = {10.48550/arXiv.2307.03109},
  eprinttype = {arXiv},
  eprint     = {2307.03109},
  timestamp  = {Wed, 06 Sep 2023 17:49:05 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-03109.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}

@article{DBLP:journals/corr/abs-2307-01137,
  author     = {Qinyong Wang and
                Zhenxiang Gao and
                Rong Xu},
  title      = {Exploring the In-context Learning Ability of Large Language Model
                for Biomedical Concept Linking},
  journal    = {CoRR},
  volume     = {abs/2307.01137},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.01137},
  doi        = {10.48550/arXiv.2307.01137},
  eprinttype = {arXiv},
  eprint     = {2307.01137},
  timestamp  = {Mon, 10 Jul 2023 17:27:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-01137.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

@article{DBLP:journals/corr/abs-2307-03393,
  author     = {Zhikai Chen and
                Haitao Mao and
                Hang Li and
                Wei Jin and
                Hongzhi Wen and
                Xiaochi Wei and
                Shuaiqiang Wang and
                Dawei Yin and
                Wenqi Fan and
                Hui Liu and
                Jiliang Tang},
  title      = {Exploring the Potential of Large Language Models ({LLMs}) in Learning
                on Graphs},
  journal    = {CoRR},
  volume     = {abs/2307.03393},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.03393},
  doi        = {10.48550/arXiv.2307.03393},
  eprinttype = {arXiv},
  eprint     = {2307.03393},
  timestamp  = {Tue, 11 Jul 2023 09:58:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-03393.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Graph Learning}
}

@article{DBLP:journals/corr/abs-2308-07134,
  author     = {Ruosong Ye and
                Caiqi Zhang and
                Runhui Wang and
                Shuyuan Xu and
                Yongfeng Zhang},
  title      = {Natural Language is All a Graph Needs},
  journal    = {CoRR},
  volume     = {abs/2308.07134},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.07134},
  doi        = {10.48550/arXiv.2308.07134},
  eprinttype = {arXiv},
  eprint     = {2308.07134},
  timestamp  = {Wed, 23 Aug 2023 14:43:32 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-07134.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Graph Learning}
}


@article{DBLP:journals/corr/abs-2308-14522,
  author     = {Ziwei Zhang and
                Haoyang Li and
                Zeyang Zhang and
                Yijian Qin and
                Xin Wang and
                Wenwu Zhu},
  title      = {Large Graph Models: {A} Perspective},
  journal    = {CoRR},
  volume     = {abs/2308.14522},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.14522},
  doi        = {10.48550/arXiv.2308.14522},
  eprinttype = {arXiv},
  eprint     = {2308.14522},
  timestamp  = {Fri, 01 Sep 2023 15:21:30 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-14522.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Graph Learning}
}

@article{DBLP:journals/corr/abs-2309-04565,
  author     = {Lanning Wei and
                Zhiqiang He and
                Huan Zhao and
                Quanming Yao},
  title      = {Unleashing the Power of Graph Learning through {LLM-based} Autonomous
                Agents},
  journal    = {CoRR},
  volume     = {abs/2309.04565},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.04565},
  doi        = {10.48550/arXiv.2309.04565},
  eprinttype = {arXiv},
  eprint     = {2309.04565},
  timestamp  = {Fri, 15 Sep 2023 12:26:52 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-04565.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Graph Learning}
}

@inproceedings{DBLP:conf/emnlp/GevaSBL21,
  author     = {Mor Geva and
                Roei Schuster and
                Jonathan Berant and
                Omer Levy},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {Transformer Feed-Forward Layers Are Key-Value Memories},
  booktitle  = {EMNLP},
  pages      = {5484--5495},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.446},
  doi        = {10.18653/v1/2021.emnlp-main.446},
  timestamp  = {Thu, 20 Jan 2022 10:02:18 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/GevaSBL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Storage and Locating}
}


@article{DBLP:journals/corr/abs-2301-10405,
  author     = {Siyuan Cheng and
                Ningyu Zhang and
                Bozhong Tian and
                Zelin Dai and
                Feiyu Xiong and
                Wei Guo and
                Huajun Chen},
  title      = {Editing Language Model-based Knowledge Graph Embeddings},
  journal    = {CoRR},
  volume     = {abs/2301.10405},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.10405},
  doi        = {10.48550/arXiv.2301.10405},
  eprinttype = {arXiv},
  eprint     = {2301.10405},
  timestamp  = {Thu, 26 Jan 2023 17:49:16 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-10405.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}


@article{DBLP:journals/corr/abs-2308-13198,
  author     = {Yuheng Chen and
                Pengfei Cao and
                Yubo Chen and
                Kang Liu and
                Jun Zhao},
  title      = {Journey to the Center of the Knowledge Neurons: Discoveries of Language-Independent
                Knowledge Neurons and Degenerate Knowledge Neurons},
  journal    = {CoRR},
  volume     = {abs/2308.13198},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.13198},
  doi        = {10.48550/arXiv.2308.13198},
  eprinttype = {arXiv},
  eprint     = {2308.13198},
  timestamp  = {Fri, 01 Sep 2023 14:25:01 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-13198.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Storage and Locating}
}


@article{DBLP:journals/corr/abs-2308-08742,
  author     = {Xiaopeng Li and
                Shasha Li and
                Shezheng Song and
                Jing Yang and
                Jun Ma and
                Jie Yu},
  title      = {{PMET:} Precise Model Editing in a Transformer},
  journal    = {CoRR},
  volume     = {abs/2308.08742},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.08742},
  doi        = {10.48550/arXiv.2308.08742},
  eprinttype = {arXiv},
  eprint     = {2308.08742},
  timestamp  = {Fri, 25 Aug 2023 11:24:49 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-08742.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}

@inproceedings{DBLP:conf/icml/MainiMSLKZ23,
  author     = {Pratyush Maini and
                Michael Curtis Mozer and
                Hanie Sedghi and
                Zachary Chase Lipton and
                J. Zico Kolter and
                Chiyuan Zhang},
  editor     = {Andreas Krause and
                Emma Brunskill and
                Kyunghyun Cho and
                Barbara Engelhardt and
                Sivan Sabato and
                Jonathan Scarlett},
  title      = {Can Neural Network Memorization Be Localized?},
  booktitle  = {ICML},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {23536--23557},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/maini23a.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/MainiMSLKZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Storage and Locating}
}

@article{DBLP:journals/corr/abs-2305-14795,
  author     = {Zexuan Zhong and
                Zhengxuan Wu and
                Christopher D. Manning and
                Christopher Potts and
                Danqi Chen},
  title      = {{MQuAKE}: Assessing Knowledge Editing in Language Models via Multi-Hop
                Questions},
  journal    = {CoRR},
  volume     = {abs/2305.14795},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.14795},
  doi        = {10.48550/arXiv.2305.14795},
  eprinttype = {arXiv},
  eprint     = {2305.14795},
  timestamp  = {Tue, 06 Jun 2023 18:10:43 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-14795.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}


@article{DBLP:journals/corr/abs-2308-14177,
  author     = {Lin Geng Foo and
                Hossein Rahmani and
                Jun Liu},
  title      = {{AIGC} for Various Data Modalities: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2308.14177},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.14177},
  doi        = {10.48550/arXiv.2308.14177},
  eprinttype = {arXiv},
  eprint     = {2308.14177},
  timestamp  = {Fri, 01 Sep 2023 14:25:01 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-14177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}


@article{ling2023domain,
  author     = {Ling, Chen and Zhao, Xujiang and Lu, Jiaying and Deng, Chengyuan and Zheng, Can and Wang, Junxiang and Chowdhury, Tanmoy and Li, Yun and Cui, Hejie and Zhao, Tianjiao and others},
  title      = {Domain specialization as the key to make large language models disruptive: A comprehensive survey},
  journal    = {CoRR},
  volume     = {abs/2305.18703},
  year       = {2023},
  url        = {https://arxiv.org/pdf/2305.18703.pdf},
  eprinttype = {arXiv},
  eprint     = {2305.18703},
  keywords   = {Survey}
}

@inproceedings{DBLP:conf/acl/Hoelscher-Obermaier23,
  author     = {Jason Hoelscher{-}Obermaier and
                Julia Persson and
                Esben Kran and
                Ioannis Konstas and
                Fazl Barez},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Detecting Edit Failures In Large Language Models: An Improved Specificity
                Benchmark},
  booktitle  = {ACL},
  pages      = {11548--11559},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.733},
  doi        = {10.18653/v1/2023.findings-acl.733},
  timestamp  = {Thu, 10 Aug 2023 12:35:52 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Hoelscher-Obermaier23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}

@article{DBLP:journals/tacl/ElazarKRRHSG21,
  author     = {Yanai Elazar and
                Nora Kassner and
                Shauli Ravfogel and
                Abhilasha Ravichander and
                Eduard H. Hovy and
                Hinrich Sch{\"{u}}tze and
                Yoav Goldberg},
  title      = {Measuring and Improving Consistency in Pretrained Language Models},
  journal    = {Trans. Assoc. Comput. Linguistics},
  volume     = {9},
  pages      = {1012--1031},
  year       = {2021},
  url        = {https://doi.org/10.1162/tacl\_a\_00410},
  doi        = {10.1162/tacl\_a\_00410},
  timestamp  = {Wed, 07 Dec 2022 23:05:10 +0100},
  biburl     = {https://dblp.org/rec/journals/tacl/ElazarKRRHSG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Quality}
}

@inproceedings{DBLP:conf/eacl/HaseDCLKSBI23,
  author     = {Peter Hase and
                Mona T. Diab and
                Asli Celikyilmaz and
                Xian Li and
                Zornitsa Kozareva and
                Veselin Stoyanov and
                Mohit Bansal and
                Srinivasan Iyer},
  editor     = {Andreas Vlachos and
                Isabelle Augenstein},
  title      = {Methods for Measuring, Updating, and Visualizing Factual Beliefs in
                Language Models},
  booktitle  = {EACL},
  pages      = {2706--2723},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://aclanthology.org/2023.eacl-main.199},
  timestamp  = {Thu, 11 May 2023 17:08:21 +0200},
  biburl     = {https://dblp.org/rec/conf/eacl/HaseDCLKSBI23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}


@inproceedings{DBLP:conf/acl/0008CJ0023,
  author     = {Yuan He and
                Jiaoyan Chen and
                Ernesto Jim{\'{e}}nez{-}Ruiz and
                Hang Dong and
                Ian Horrocks},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Language Model Analysis for Ontology Subsumption Inference},
  booktitle  = {ACL},
  pages      = {3439--3453},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.213},
  doi        = {10.18653/v1/2023.findings-acl.213},
  timestamp  = {Thu, 10 Aug 2023 12:36:04 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/0008CJ0023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Language Model as Knowledge Base}
}

@inproceedings{DBLP:conf/acl/HaoTTNSZXH23,
  author     = {Shibo Hao and
                Bowen Tan and
                Kaiwen Tang and
                Bin Ni and
                Xiyan Shao and
                Hengzhe Zhang and
                Eric P. Xing and
                Zhiting Hu},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {{BertNet}: Harvesting Knowledge Graphs with Arbitrary Relations from
                Pretrained Language Models},
  booktitle  = {ACL},
  pages      = {5000--5015},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.309},
  doi        = {10.18653/v1/2023.findings-acl.309},
  timestamp  = {Thu, 10 Aug 2023 12:35:49 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/HaoTTNSZXH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Language Model as Knowledge Base}
}

@inproceedings{DBLP:conf/acl/JiangAJW0023,
  author     = {Pengcheng Jiang and
                Shivam Agarwal and
                Bowen Jin and
                Xuan Wang and
                Jimeng Sun and
                Jiawei Han},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Text Augmented Open Knowledge Graph Completion via Pre-Trained Language
                Models},
  booktitle  = {ACL},
  pages      = {11161--11180},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.709},
  doi        = {10.18653/v1/2023.findings-acl.709},
  timestamp  = {Wed, 30 Aug 2023 15:34:14 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/JiangAJW0023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Language Model as Knowledge Base}
}

@article{DBLP:journals/corr/abs-2309-11495,
  author     = {Shehzaad Dhuliawala and
                Mojtaba Komeili and
                Jing Xu and
                Roberta Raileanu and
                Xian Li and
                Asli Celikyilmaz and
                Jason Weston},
  title      = {Chain-of-Verification Reduces Hallucination in Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2309.11495},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.11495},
  doi        = {10.48550/arXiv.2309.11495},
  eprinttype = {arXiv},
  eprint     = {2309.11495},
  timestamp  = {Mon, 25 Sep 2023 15:34:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-11495.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Verification}
}

@inproceedings{DBLP:conf/iclr/ShiSF0SVCTRZ0W23,
  author     = {Freda Shi and
                Mirac Suzgun and
                Markus Freitag and
                Xuezhi Wang and
                Suraj Srivats and
                Soroush Vosoughi and
                Hyung Won Chung and
                Yi Tay and
                Sebastian Ruder and
                Denny Zhou and
                Dipanjan Das and
                Jason Wei},
  title      = {Language models are multilingual chain-of-thought reasoners},
  booktitle  = {ICLR},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=fR3wGCk-IXp},
  timestamp  = {Fri, 30 Jun 2023 14:55:53 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ShiSF0SVCTRZ0W23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2307-02046,
  author     = {Wenqi Fan and
                Zihuai Zhao and
                Jiatong Li and
                Yunqing Liu and
                Xiaowei Mei and
                Yiqi Wang and
                Jiliang Tang and
                Qing Li},
  title      = {Recommender Systems in the Era of Large Language Models ({LLMs})},
  journal    = {CoRR},
  volume     = {abs/2307.02046},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.02046},
  doi        = {10.48550/arXiv.2307.02046},
  eprinttype = {arXiv},
  eprint     = {2307.02046},
  timestamp  = {Sat, 30 Sep 2023 10:10:47 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-02046.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Recommender System}
}

@article{DBLP:journals/corr/abs-2303-04226,
  author       = {Yihan Cao and
                  Siyu Li and
                  Yixin Liu and
                  Zhiling Yan and
                  Yutong Dai and
                  Philip S. Yu and
                  Lichao Sun},
  title        = {A Comprehensive Survey of AI-Generated Content {(AIGC):} {A} History
                  of Generative {AI} from {GAN} to {ChatGPT}},
  journal      = {CoRR},
  volume       = {abs/2303.04226},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.04226},
  doi          = {10.48550/arXiv.2303.04226},
  eprinttype   = {arXiv},
  eprint       = {2303.04226},
  timestamp    = {Thu, 16 Mar 2023 08:47:21 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-04226.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Survey}
}

@misc{shi2023mededit,
  title         = {{MedEdit}: Model Editing for Medical Question Answering with External Knowledge Bases},
  author        = {Yucheng Shi and Shaochen Xu and Zhengliang Liu and Tianming Liu and Xiang Li and Ninghao Liu},
  year          = {2023},
  eprint        = {2309.16035},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2309.16035.pdf},
  keywords      = {Knowledge Editing}
}


@article{DBLP:journals/corr/abs-2305-16582,
  author       = {Yao Yao and
                  Zuchao Li and
                  Hai Zhao},
  title        = {Beyond Chain-of-Thought, Effective Graph-of-Thought Reasoning in Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2305.16582},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.16582},
  doi          = {10.48550/arXiv.2305.16582},
  eprinttype   = {arXiv},
  eprint       = {2305.16582},
  timestamp    = {Wed, 07 Jun 2023 14:31:13 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-16582.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2308-06207,
  author       = {Fanglong Yao and
                  Changyuan Tian and
                  Jintao Liu and
                  Zequn Zhang and
                  Qing Liu and
                  Li Jin and
                  Shuchao Li and
                  Xiaoyu Li and
                  Xian Sun},
  title        = {Thinking Like an Expert: Multimodal Hypergraph-of-Thought ({HoT}) Reasoning
                  to boost Foundation Modals},
  journal      = {CoRR},
  volume       = {abs/2308.06207},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.06207},
  doi          = {10.48550/arXiv.2308.06207},
  eprinttype   = {arXiv},
  eprint       = {2308.06207},
  timestamp    = {Wed, 23 Aug 2023 14:43:32 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-06207.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2309-04461,
  author       = {Yangyi Chen and
                  Karan Sikka and
                  Michael Cogswell and
                  Heng Ji and
                  Ajay Divakaran},
  title        = {Measuring and Improving Chain-of-Thought Reasoning in Vision-Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2309.04461},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.04461},
  doi          = {10.48550/arXiv.2309.04461},
  eprinttype   = {arXiv},
  eprint       = {2309.04461},
  timestamp    = {Tue, 12 Sep 2023 12:50:52 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-04461.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2308-08614,
  author       = {Bin Lei and
                  Pei{-}Hung Lin and
                  Chunhua Liao and
                  Caiwen Ding},
  title        = {Boosting Logical Reasoning in Large Language Models through a New
                  Framework: The Graph of Thought},
  journal      = {CoRR},
  volume       = {abs/2308.08614},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.08614},
  doi          = {10.48550/arXiv.2308.08614},
  eprinttype   = {arXiv},
  eprint       = {2308.08614},
  timestamp    = {Fri, 25 Aug 2023 11:24:49 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-08614.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2305-10601,
  author       = {Shunyu Yao and
                  Dian Yu and
                  Jeffrey Zhao and
                  Izhak Shafran and
                  Thomas L. Griffiths and
                  Yuan Cao and
                  Karthik Narasimhan},
  title        = {Tree of Thoughts: Deliberate Problem Solving with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2305.10601},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.10601},
  doi          = {10.48550/arXiv.2305.10601},
  eprinttype   = {arXiv},
  eprint       = {2305.10601},
  timestamp    = {Thu, 25 May 2023 15:41:47 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-10601.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}


@article{DBLP:journals/corr/abs-2308-09658,
  author       = {Pengbo Hu and
                  Ji Qi and
                  Xingyu Li and
                  Hong Li and
                  Xinqi Wang and
                  Bing Quan and
                  Ruiyu Wang and
                  Yi Zhou},
  title        = {Tree-of-Mixed-Thought: Combining Fast and Slow Thinking for Multi-hop
                  Visual Reasoning},
  journal      = {CoRR},
  volume       = {abs/2308.09658},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.09658},
  doi          = {10.48550/arXiv.2308.09658},
  eprinttype   = {arXiv},
  eprint       = {2308.09658},
  timestamp    = {Fri, 25 Aug 2023 11:24:49 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-09658.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2308-10792,
  author       = {Shengyu Zhang and
                  Linfeng Dong and
                  Xiaoya Li and
                  Sen Zhang and
                  Xiaofei Sun and
                  Shuhe Wang and
                  Jiwei Li and
                  Runyi Hu and
                  Tianwei Zhang and
                  Fei Wu and
                  Guoyin Wang},
  title        = {Instruction Tuning for Large Language Models: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2308.10792},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.10792},
  doi          = {10.48550/arXiv.2308.10792},
  eprinttype   = {arXiv},
  eprint       = {2308.10792},
  timestamp    = {Wed, 30 Aug 2023 17:27:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-10792.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Survey}
}

@article{DBLP:journals/corr/abs-2305-14726,
  author       = {Dan Iter and
                  Reid Pryzant and
                  Ruochen Xu and
                  Shuohang Wang and
                  Yang Liu and
                  Yichong Xu and
                  Chenguang Zhu},
  title        = {In-Context Demonstration Selection with Cross Entropy Difference},
  journal      = {CoRR},
  volume       = {abs/2305.14726},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14726},
  doi          = {10.48550/arXiv.2305.14726},
  eprinttype   = {arXiv},
  eprint       = {2305.14726},
  timestamp    = {Thu, 29 Jun 2023 16:58:03 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14726.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {In-Context Learning}
}

  @inproceedings{DBLP:conf/acl/MonajatipoorLR023,
  author       = {Masoud Monajatipoor and
                  Liunian Harold Li and
                  Mozhdeh Rouhsedaghat and
                  Lin Yang and
                  Kai{-}Wei Chang},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {{MetaVL}: Transferring In-Context Learning Ability From Language Models
                  to Vision-Language Models},
  booktitle    = {ACL},
  pages        = {495--508},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-short.43},
  doi          = {10.18653/v1/2023.acl-short.43},
  timestamp    = {Thu, 10 Aug 2023 12:35:40 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/MonajatipoorLR023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {In-Context Learning}
}

@article{DBLP:journals/corr/abs-2307-07742,
  author       = {Yi{-}Syuan Chen and
                  Yun{-}Zhu Song and
                  Cheng Yu Yeo and
                  Bei Liu and
                  Jianlong Fu and
                  Hong{-}Han Shuai},
  title        = {{SINC:} Self-Supervised In-Context Learning for Vision-Language Tasks},
  journal      = {CoRR},
  volume       = {abs/2307.07742},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.07742},
  doi          = {10.48550/arXiv.2307.07742},
  eprinttype   = {arXiv},
  eprint       = {2307.07742},
  timestamp    = {Tue, 25 Jul 2023 16:04:08 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-07742.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {In-Context Learning}
}

@article{DBLP:journals/corr/abs-2309-16289,
  author       = {Zhiwei Fei and
                  Xiaoyu Shen and
                  Dawei Zhu and
                  Fengzhe Zhou and
                  Zhuo Han and
                  Songyang Zhang and
                  Kai Chen and
                  Zongwen Shen and
                  Jidong Ge},
  title        = {{LawBench}: Benchmarking Legal Knowledge of Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2309.16289},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.16289},
  doi          = {10.48550/ARXIV.2309.16289},
  eprinttype   = {arXiv},
  eprint       = {2309.16289},
  timestamp    = {Tue, 17 Oct 2023 13:50:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-16289.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Application}
}

@article{DBLP:journals/corr/abs-2308-11462,
  author       = {Neel Guha and
                  Julian Nyarko and
                  Daniel E. Ho and
                  Christopher R{\'{e}} and
                  Adam Chilton and
                  Aditya Narayana and
                  Alex Chohlas{-}Wood and
                  Austin Peters and
                  Brandon Waldon and
                  Daniel N. Rockmore and
                  Diego Zambrano and
                  Dmitry Talisman and
                  Enam Hoque and
                  Faiz Surani and
                  Frank Fagan and
                  Galit Sarfaty and
                  Gregory M. Dickinson and
                  Haggai Porat and
                  Jason Hegland and
                  Jessica Wu and
                  Joe Nudell and
                  Joel Niklaus and
                  John J. Nay and
                  Jonathan H. Choi and
                  Kevin Tobia and
                  Margaret Hagan and
                  Megan Ma and
                  Michael A. Livermore and
                  Nikon Rasumov{-}Rahe and
                  Nils Holzenberger and
                  Noam Kolt and
                  Peter Henderson and
                  Sean Rehaag and
                  Sharad Goel and
                  Shang Gao and
                  Spencer Williams and
                  Sunny Gandhi and
                  Tom Zur and
                  Varun Iyer and
                  Zehua Li},
  title        = {{LegalBench}: {A} Collaboratively Built Benchmark for Measuring Legal
                  Reasoning in Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2308.11462},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.11462},
  doi          = {10.48550/ARXIV.2308.11462},
  eprinttype   = {arXiv},
  eprint       = {2308.11462},
  timestamp    = {Wed, 30 Aug 2023 17:27:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-11462.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Application}
}


@article{DBLP:journals/corr/abs-2310-07521,
  author       = {Cunxiang Wang and
                  Xiaoze Liu and
                  Yuanhao Yue and
                  Xiangru Tang and
                  Tianhang Zhang and
                  Jiayang Cheng and
                  Yunzhi Yao and
                  Wenyang Gao and
                  Xuming Hu and
                  Zehan Qi and
                  Yidong Wang and
                  Linyi Yang and
                  Jindong Wang and
                  Xing Xie and
                  Zheng Zhang and
                  Yue Zhang},
  title        = {Survey on Factuality in Large Language Models: Knowledge, Retrieval
                  and Domain-Specificity},
  journal      = {CoRR},
  volume       = {abs/2310.07521},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.07521},
  doi          = {10.48550/ARXIV.2310.07521},
  eprinttype   = {arXiv},
  eprint       = {2310.07521},
  timestamp    = {Tue, 24 Oct 2023 14:46:18 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-07521.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Survey}
}

@article{DBLP:journals/corr/abs-2308-13676,
  author       = {Vishwas Mruthyunjaya and
                  Pouya Pezeshkpour and
                  Estevam Hruschka and
                  Nikita Bhutani},
  title        = {Rethinking Language Models as Symbolic Knowledge Graphs},
  journal      = {CoRR},
  volume       = {abs/2308.13676},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.13676},
  doi          = {10.48550/ARXIV.2308.13676},
  eprinttype   = {arXiv},
  eprint       = {2308.13676},
  timestamp    = {Fri, 01 Sep 2023 14:25:01 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-13676.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Language Model as Knowledge Base}
}

@inproceedings{DBLP:conf/acl/ZhangG023,
  author       = {Kai Zhang and
                  Bernal Jimenez Gutierrez and
                  Yu Su},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Aligning Instruction Tasks Unlocks Large Language Models as Zero-Shot
                  Relation Extractors},
  booktitle    = {Findings of ACL},
  pages        = {794--812},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.50},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.50},
  timestamp    = {Thu, 10 Aug 2023 12:35:40 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhangG023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Information Extraction}
}

@misc{chen2023demonstrations,
  title         = {How Many Demonstrations Do You Need for In-context Learning?},
  author        = {Jiuhai Chen and Lichang Chen and Chen Zhu and Tianyi Zhou},
  year          = {2023},
  eprint        = {2303.08119},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
  url           = {https://arxiv.org/pdf/2303.08119.pdf},
  keywords      = {In-Context Learning}
}

@misc{han2023explaining,
  title         = {Explaining Emergent In-Context Learning as Kernel Regression},
  author        = {Chi Han and Ziqi Wang and Han Zhao and Heng Ji},
  year          = {2023},
  eprint        = {2305.12766},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2305.12766},
  keywords      = {In-Context Learning}
}

@inproceedings{DBLP:conf/iclr/Jin0P023,
  author       = {Xisen Jin and
                  Xiang Ren and
                  Daniel Preotiuc{-}Pietro and
                  Pengxiang Cheng},
  title        = {Dataless Knowledge Fusion by Merging Weights of Language Models},
  booktitle    = {ICLR},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=FCnohuR6AnM},
  timestamp    = {Fri, 30 Jun 2023 14:55:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Jin0P023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}


@article{DBLP:journals/corr/abs-2309-15698,
  author       = {Weishi Li and
                  Yong Peng and
                  Miao Zhang and
                  Liang Ding and
                  Han Hu and
                  Li Shen},
  title        = {Deep Model Fusion: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2309.15698},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.15698},
  doi          = {10.48550/ARXIV.2309.15698},
  eprinttype   = {arXiv},
  eprint       = {2309.15698},
  timestamp    = {Tue, 17 Oct 2023 13:50:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-15698.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Survey}
}

@article{DBLP:journals/corr/abs-2310-02575,
  author       = {Enneng Yang and
                  Zhenyi Wang and
                  Li Shen and
                  Shiwei Liu and
                  Guibing Guo and
                  Xingwei Wang and
                  Dacheng Tao},
  title        = {{AdaMerging}: Adaptive Model Merging for Multi-Task Learning},
  journal      = {CoRR},
  volume       = {abs/2310.02575},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.02575},
  doi          = {10.48550/ARXIV.2310.02575},
  eprinttype   = {arXiv},
  eprint       = {2310.02575},
  timestamp    = {Thu, 19 Oct 2023 13:12:52 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-02575.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}

@article{DBLP:journals/corr/abs-2306-01708,
  author       = {Prateek Yadav and
                  Derek Tam and
                  Leshem Choshen and
                  Colin Raffel and
                  Mohit Bansal},
  title        = {Resolving Interference When Merging Models},
  journal      = {CoRR},
  volume       = {abs/2306.01708},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.01708},
  doi          = {10.48550/ARXIV.2306.01708},
  eprinttype   = {arXiv},
  eprint       = {2306.01708},
  timestamp    = {Mon, 12 Jun 2023 16:25:59 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-01708.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}

@article{DBLP:journals/corr/abs-2310-01334,
  author       = {Pingzhi Li and
                  Zhenyu Zhang and
                  Prateek Yadav and
                  Yi{-}Lin Sung and
                  Yu Cheng and
                  Mohit Bansal and
                  Tianlong Chen},
  title        = {Merge, Then Compress: Demystify Efficient {SMoE} with Hints from Its
                  Routing Policy},
  journal      = {CoRR},
  volume       = {abs/2310.01334},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.01334},
  doi          = {10.48550/ARXIV.2310.01334},
  eprinttype   = {arXiv},
  eprint       = {2310.01334},
  timestamp    = {Wed, 18 Oct 2023 16:20:58 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-01334.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}

@misc{daheim2023model,
  title         = {Model Merging by Uncertainty-Based Gradient Matching},
  author        = {Nico Daheim and Thomas M{\"{o}}llenhoff and Edoardo Maria Ponti and Iryna Gurevych and Mohammad Emtiyaz Khan},
  year          = {2023},
  eprint        = {2310.12808},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2310.12808},
  keywords      = {Knowledge Fusion}
}

@article{DBLP:journals/corr/abs-2309-02144,
  author       = {Peiyi Wang and
                  Lei Li and
                  Liang Chen and
                  Feifan Song and
                  Binghuai Lin and
                  Yunbo Cao and
                  Tianyu Liu and
                  Zhifang Sui},
  title        = {Making Large Language Models Better Reasoners with Alignment},
  journal      = {CoRR},
  volume       = {abs/2309.02144},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.02144},
  doi          = {10.48550/ARXIV.2309.02144},
  eprinttype   = {arXiv},
  eprint       = {2309.02144},
  timestamp    = {Wed, 13 Sep 2023 11:57:05 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-02144.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}

@misc{li2023making,
  title         = {Making Large Language Models Better Reasoners with Step-Aware Verifier},
  author        = {Yifei Li and Zeqi Lin and Shizhuo Zhang and Qiang Fu and Bei Chen and Jian-Guang Lou and Weizhu Chen},
  year          = {2023},
  eprint        = {2206.02336},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2206.02336},
  keywords      = {Chain of Thought}
}

@inproceedings{DBLP:conf/acl/HsiehLYNFRKLP23,
  author       = {Cheng{-}Yu Hsieh and
                  Chun{-}Liang Li and
                  Chih{-}Kuan Yeh and
                  Hootan Nakhost and
                  Yasuhisa Fujii and
                  Alex Ratner and
                  Ranjay Krishna and
                  Chen{-}Yu Lee and
                  Tomas Pfister},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Distilling Step-by-Step! Outperforming Larger Language Models with
                  Less Training Data and Smaller Model Sizes},
  booktitle    = {Findings of ACL},
  pages        = {8003--8017},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.507},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.507},
  timestamp    = {Thu, 10 Aug 2023 12:36:02 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/HsiehLYNFRKLP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Distillation}
}


@article{DBLP:journals/corr/abs-2310-01542,
  author       = {Hongyi Wang and
                  Felipe Maia Polo and
                  Yuekai Sun and
                  Souvik Kundu and
                  Eric P. Xing and
                  Mikhail Yurochkin},
  title        = {Fusing Models with Complementary Expertise},
  journal      = {CoRR},
  volume       = {abs/2310.01542},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.01542},
  doi          = {10.48550/ARXIV.2310.01542},
  eprinttype   = {arXiv},
  eprint       = {2310.01542},
  timestamp    = {Thu, 19 Oct 2023 13:12:52 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-01542.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}

@inproceedings{DBLP:conf/iclr/FuPSCK23,
  author       = {Yao Fu and
                  Hao Peng and
                  Ashish Sabharwal and
                  Peter Clark and
                  Tushar Khot},
  title        = {Complexity-Based Prompting for Multi-step Reasoning},
  booktitle    = {ICLR},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=yf1icZHC-l9},
  timestamp    = {Fri, 30 Jun 2023 14:55:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/FuPSCK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Multi-Step Reasoning}
}

@article{DBLP:journals/corr/abs-2310-02527,
  author       = {Tao Feng and
                  Zifeng Wang and
                  Jimeng Sun},
  title        = {{CITING:} Large Language Models Create Curriculum for Instruction
                  Tuning},
  journal      = {CoRR},
  volume       = {abs/2310.02527},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.02527},
  doi          = {10.48550/ARXIV.2310.02527},
  eprinttype   = {arXiv},
  eprint       = {2310.02527},
  timestamp    = {Mon, 23 Oct 2023 15:28:12 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-02527.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Knowledge Fusion}
}

@article{DBLP:journals/corr/abs-2309-15402,
  author       = {Zheng Chu and
                  Jingchang Chen and
                  Qianglong Chen and
                  Weijiang Yu and
                  Tao He and
                  Haotian Wang and
                  Weihua Peng and
                  Ming Liu and
                  Bing Qin and
                  Ting Liu},
  title        = {A Survey of Chain of Thought Reasoning: Advances, Frontiers and Future},
  journal      = {CoRR},
  volume       = {abs/2309.15402},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.15402},
  doi          = {10.48550/ARXIV.2309.15402},
  eprinttype   = {arXiv},
  eprint       = {2309.15402},
  timestamp    = {Tue, 17 Oct 2023 13:50:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-15402.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Survey}
}

@inproceedings{DBLP:conf/eacl/AllawayHBMDC23,
  author       = {Emily Allaway and
                  Jena D. Hwang and
                  Chandra Bhagavatula and
                  Kathleen R. McKeown and
                  Doug Downey and
                  Yejin Choi},
  editor       = {Andreas Vlachos and
                  Isabelle Augenstein},
  title        = {Penguins Don't Fly: Reasoning about Generics through Instantiations
                  and Exceptions},
  booktitle    = {EACL},
  pages        = {2610--2627},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.eacl-main.192},
  doi          = {10.18653/V1/2023.EACL-MAIN.192},
  timestamp    = {Thu, 05 Oct 2023 18:05:03 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/AllawayHBMDC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Symbolic Reasoning}
}


@inproceedings{DBLP:conf/acl/LaskarBRBJH23,
  author       = {Md. Tahmid Rahman Laskar and
                  M. Saiful Bari and
                  Mizanur Rahman and
                  Md Amran Hossen Bhuiyan and
                  Shafiq Joty and
                  Jimmy X. Huang},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {A Systematic Study and Comprehensive Evaluation of {ChatGPT} on Benchmark
                  Datasets},
  booktitle    = {Findings of ACL},
  pages        = {431--469},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.29},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.29},
  timestamp    = {Thu, 10 Aug 2023 12:36:06 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LaskarBRBJH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Evaluation}
}


@article{DBLP:journals/corr/abs-2308-12488,
  author       = {Rui Mao and
                  Guanyi Chen and
                  Xulang Zhang and
                  Frank Guerin and
                  Erik Cambria},
  title        = {{GPTEval}: {A} Survey on Assessments of {ChatGPT} and {GPT-4}},
  journal      = {CoRR},
  volume       = {abs/2308.12488},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.12488},
  doi          = {10.48550/ARXIV.2308.12488},
  eprinttype   = {arXiv},
  eprint       = {2308.12488},
  timestamp    = {Wed, 30 Aug 2023 17:27:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-12488.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Evaluation}
}

@article{DBLP:journals/corr/abs-2310-05028,
  author       = {Guozheng Li and
                  Peng Wang and
                  Wenjun Ke},
  title        = {Revisiting Large Language Models as Zero-shot Relation Extractors},
  journal      = {CoRR},
  volume       = {abs/2310.05028},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.05028},
  doi          = {10.48550/ARXIV.2310.05028},
  eprinttype   = {arXiv},
  eprint       = {2310.05028},
  timestamp    = {Fri, 20 Oct 2023 12:04:38 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-05028.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Information Extraction}
}


@article{DBLP:journals/corr/abs-2310-06692,
  author       = {Anni Zou and
                  Zhuosheng Zhang and
                  Hai Zhao and
                  Xiangru Tang},
  title        = {{Meta-CoT}: Generalizable Chain-of-Thought Prompting in Mixed-task Scenarios
                  with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2310.06692},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.06692},
  doi          = {10.48550/ARXIV.2310.06692},
  eprinttype   = {arXiv},
  eprint       = {2310.06692},
  timestamp    = {Tue, 24 Oct 2023 14:46:18 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-06692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Chain of Thought}
}


@article{DBLP:journals/corr/abs-2305-04978,
  author       = {Phillip Howard and
                  Junlin Wang and
                  Vasudev Lal and
                  Gadi Singer and
                  Yejin Choi and
                  Swabha Swayamdipta},
  title        = {{NeuroComparatives}: Neuro-Symbolic Distillation of Comparative Knowledge},
  journal      = {CoRR},
  volume       = {abs/2305.04978},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.04978},
  doi          = {10.48550/ARXIV.2305.04978},
  eprinttype   = {arXiv},
  eprint       = {2305.04978},
  timestamp    = {Fri, 12 May 2023 16:06:58 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-04978.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Symbolic Reasoning}
}

@article{DBLP:journals/corr/abs-2305-14898,
  author     = {Keming Lu and Xiaoman Pan and Kaiqiang Song and Hongming Zhang and Dong Yu and Jianshu Chen},
  title      = {{PIVOINE:} Instruction Tuning for Open-world Information Extraction},
  journal    = {CoRR},
  volume     = {abs/2305.14898},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2305.14898},
  doi        = {10.48550/ARXIV.2305.14898},
  url        = {https://doi.org/10.48550/arXiv.2305.14898},
  timestamp  = {Wed, 21 Jun 2023 15:57:12 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-14898.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2310-12537,
  author     = {Alexander Brinkmann and Roee Shraga and Christian Bizer},
  title      = {Product Attribute Value Extraction using Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.12537},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2310.12537},
  doi        = {10.48550/ARXIV.2310.12537},
  url        = {https://doi.org/10.48550/arXiv.2310.12537},
  timestamp  = {Fri, 27 Oct 2023 12:21:19 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-12537.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2305-02105,
  author     = {Zhen Wan and Fei Cheng and Zhuoyuan Mao and Qianying Liu and Haiyue Song and Jiwei Li and Sadao Kurohashi},
  title      = {{GPT-RE:} In-context Learning for Relation Extraction using Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2305.02105},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2305.02105},
  doi        = {10.48550/ARXIV.2305.02105},
  url        = {https://doi.org/10.48550/arXiv.2305.02105},
  timestamp  = {Fri, 05 May 2023 14:35:02 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-02105.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@inproceedings{DBLP:conf/acl/ChenSFC0X23,
  author    = {Jiangjie Chen and Wei Shi and Ziquan Fu and Sijie Cheng and Lei Li and Yanghua Xiao},
  editor    = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title     = {Say What You Mean! Large Language Models Speak Too Positively about Negative Commonsense Knowledge},
  booktitle = {ACL},
  pages     = {9890--9908},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  doi       = {10.18653/V1/2023.ACL-LONG.550},
  url       = {https://doi.org/10.18653/v1/2023.acl-long.550},
  timestamp = {Tue, 22 Aug 2023 07:49:35 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/ChenSFC0X23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Symbolic Reasoning}
}

@inproceedings{DBLP:conf/acl/WuZH23,
  author    = {Dingjun Wu and Jing Zhang and Xinmei Huang},
  editor    = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title     = {Chain of Thought Prompting Elicits Knowledge Augmentation},
  booktitle = {ACL},
  pages     = {6519--6534},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  doi       = {10.18653/V1/2023.FINDINGS-ACL.408},
  url       = {https://doi.org/10.18653/v1/2023.findings-acl.408},
  timestamp = {Thu, 10 Aug 2023 12:36:05 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/WuZH23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2309-17382,
  author     = {Zhihan Liu and Hao Hu and Shenao Zhang and Hongyi Guo and Shuqi Ke and Boyi Liu and Zhaoran Wang},
  title      = {Reason for Future, Act for Now: {A} Principled Framework for Autonomous {LLM} Agents with Provable Sample Efficiency},
  journal    = {CoRR},
  volume     = {abs/2309.17382},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2309.17382},
  doi        = {10.48550/ARXIV.2309.17382},
  url        = {https://doi.org/10.48550/arXiv.2309.17382},
  timestamp  = {Tue, 17 Oct 2023 13:50:54 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-17382.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Agent}
}


@misc{unknown,
  author   = {Alessandro Sordoni and Xingdi Yuan and Marc-Alexandre Cote and Matheus Pereira and Adam Trischler and Ziang Xiao and Arian Hosseini and Friederike Niedtner and Nicolas Le Roux},
  title    = {Joint Prompt Optimization of Stacked LLMs using Variational Inference},
  year     = {2023},
  pages    = {24},
  url      = {https://openreview.net/pdf?id=iImnbUVhok},
  keywords = {Prompt Engineering}
}


@inproceedings{DBLP:conf/kdd/SunCLLG23,
  author    = {Xiangguo Sun and Hong Cheng and Jia Li and Bo Liu and Jihong Guan},
  editor    = {Ambuj K. Singh and Yizhou Sun and Leman Akoglu and Dimitrios Gunopulos and Xifeng Yan and Ravi Kumar and Fatma Ozcan and Jieping Ye},
  title     = {All in One: Multi-Task Prompting for Graph Neural Networks},
  booktitle = {KDD},
  pages     = {2120--2131},
  publisher = {{ACM}},
  year      = {2023},
  doi       = {10.1145/3580305.3599256},
  url       = {https://doi.org/10.1145/3580305.3599256},
  timestamp = {Mon, 25 Sep 2023 08:29:22 +0200},
  biburl    = {https://dblp.org/rec/conf/kdd/SunCLLG23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {LLM and GNN}
}

@article{DBLP:journals/corr/abs-2309-15427,
  author     = {Yijun Tian and Huan Song and Zichen Wang and Haozhu Wang and Ziqing Hu and Fang Wang and Nitesh V. Chawla and Panpan Xu},
  title      = {Graph Neural Prompting with Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2309.15427},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2309.15427},
  doi        = {10.48550/ARXIV.2309.15427},
  url        = {https://doi.org/10.48550/arXiv.2309.15427},
  timestamp  = {Tue, 17 Oct 2023 13:50:54 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-15427.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {LLM and GNN}
}

@article{DBLP:journals/corr/abs-2311-16534,
  author     = {Xiangguo Sun and Jiawen Zhang and Xixi Wu and Hong Cheng and Yun Xiong and Jia Li},
  title      = {Graph Prompt Learning: {A} Comprehensive Survey and Beyond},
  journal    = {CoRR},
  volume     = {abs/2311.16534},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2311.16534},
  doi        = {10.48550/ARXIV.2311.16534},
  url        = {https://doi.org/10.48550/arXiv.2311.16534},
  timestamp  = {Mon, 04 Dec 2023 10:53:08 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-16534.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {LLM and GNN}
}

@misc{jin2023large,
  author        = {Bowen Jin and Gang Liu and Chi Han and Meng Jiang and Heng Ji and Jiawei Han},
  title         = {Large Language Models on Graphs: A Comprehensive Survey},
  year          = {2023},
  eprint        = {2312.02783},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://export.arxiv.org/abs/2312.02783},
  keywords      = {LLM and GNN}
}

@article{DBLP:journals/corr/abs-2311-07850,
  author     = {Dhruv Agarwal and Rajarshi Das and Sopan Khosla and Rashmi Gangadharaiah},
  title      = {Bring Your Own {KG:} Self-Supervised Program Synthesis for Zero-Shot {KGQA}},
  journal    = {CoRR},
  volume     = {abs/2311.07850},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2311.07850},
  doi        = {10.48550/ARXIV.2311.07850},
  url        = {https://doi.org/10.48550/arXiv.2311.07850},
  timestamp  = {Tue, 21 Nov 2023 13:55:21 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-07850.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Question Answering}
}


@inproceedings{DBLP:conf/kdd/SunZHWW22,
  author    = {Mingchen Sun and Kaixiong Zhou and Xin He and Ying Wang and Xin Wang},
  editor    = {Aidong Zhang and Huzefa Rangwala},
  title     = {{GPPT:} Graph Pre-training and Prompt Tuning to Generalize Graph Neural Networks},
  booktitle = {KDD},
  pages     = {1717--1727},
  publisher = {{ACM}},
  year      = {2022},
  doi       = {10.1145/3534678.3539249},
  url       = {https://doi.org/10.1145/3534678.3539249},
  timestamp = {Sat, 30 Sep 2023 09:51:45 +0200},
  biburl    = {https://dblp.org/rec/conf/kdd/SunZHWW22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {LLM and GNN}
}

@article{DBLP:journals/corr/abs-2309-01029,
  author     = {Haiyan Zhao and Hanjie Chen and Fan Yang and Ninghao Liu and Huiqi Deng and Hengyi Cai and Shuaiqiang Wang and Dawei Yin and Mengnan Du},
  title      = {Explainability for Large Language Models: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2309.01029},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2309.01029},
  doi        = {10.48550/ARXIV.2309.01029},
  url        = {https://doi.org/10.48550/arXiv.2309.01029},
  timestamp  = {Mon, 11 Sep 2023 16:01:35 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-01029.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}

@misc{xu2023large,
  author        = {Derong Xu and Wei Chen and Wenjun Peng and Chao Zhang and Tong Xu and Xiangyu Zhao and Xian Wu and Yefeng Zheng and Enhong Chen},
  title         = {Large Language Models for Generative Information Extraction: A Survey},
  year          = {2023},
  eprint        = {2312.17617},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2312.17617},
  keywords      = {Survey}
}


@inproceedings{DBLP:conf/semweb/MihindukulasooriyaTEL23,
  author    = {Nandana Mihindukulasooriya and Sanju Tiwari and Carlos F. Enguix and Kusum Lata},
  editor    = {Terry R. Payne and Valentina Presutti and Guilin Qi and Mar{\'{\i}}a Poveda{-}Villal{\'{o}}n and Giorgos Stoilos and Laura Hollink and Zoi Kaoudi and Gong Cheng and Juanzi Li},
  title     = {Text2KGBench: {A} Benchmark for Ontology-Driven Knowledge Graph Generation from Text},
  booktitle = {ISWC},
  series    = {Lecture Notes in Computer Science},
  volume    = {14266},
  pages     = {247--265},
  publisher = {Springer},
  year      = {2023},
  doi       = {10.1007/978-3-031-47243-5\_14},
  url       = {https://doi.org/10.1007/978-3-031-47243-5\_14},
  timestamp = {Thu, 09 Nov 2023 21:12:57 +0100},
  biburl    = {https://dblp.org/rec/conf/semweb/MihindukulasooriyaTEL23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Information Extraction}
}


@inproceedings{DBLP:conf/emnlp/GaoD0023,
  author    = {Jinglong Gao and Xiao Ding and Bing Qin and Ting Liu},
  editor    = {Houda Bouamor and Juan Pino and Kalika Bali},
  title     = {Is ChatGPT a Good Causal Reasoner? {A} Comprehensive Evaluation},
  booktitle = {EMNLP},
  pages     = {11111--11126},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  url       = {https://aclanthology.org/2023.findings-emnlp.743},
  timestamp = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/GaoD0023.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Event Relation Extraction}
}

@article{DBLP:journals/corr/abs-2402-01619,
  author     = {Jiajie Zhang and Shulin Cao and Linmei Hu and Ling Feng and Lei Hou and Juanzi Li},
  title      = {KB-Plugin: {A} Plug-and-play Framework for Large Language Models to Induce Programs over Low-resourced Knowledge Bases},
  journal    = {CoRR},
  volume     = {abs/2402.01619},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2402.01619},
  doi        = {10.48550/ARXIV.2402.01619},
  url        = {https://doi.org/10.48550/arXiv.2402.01619},
  timestamp  = {Fri, 09 Feb 2024 12:18:48 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-01619.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Question Answering}
}

@article{DBLP:journals/corr/abs-2311-12399,
  author     = {Yuhan Li and Zhixun Li and Peisong Wang and Jia Li and Xiangguo Sun and Hong Cheng and Jeffrey Xu Yu},
  title      = {A Survey of Graph Meets Large Language Model: Progress and Future Directions},
  journal    = {CoRR},
  volume     = {abs/2311.12399},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2311.12399},
  doi        = {10.48550/ARXIV.2311.12399},
  url        = {https://doi.org/10.48550/arXiv.2311.12399},
  timestamp  = {Wed, 29 Nov 2023 17:42:08 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-12399.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}

@inproceedings{DBLP:conf/emnlp/LuPSZYC23,
  author       = {Keming Lu and
                  Xiaoman Pan and
                  Kaiqiang Song and
                  Hongming Zhang and
                  Dong Yu and
                  Jianshu Chen},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {{PIVOINE:} Instruction Tuning for Open-world Entity Profiling},
  booktitle    = {EMNLP},
  pages        = {15108--15127},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.findings-emnlp.1009},
  timestamp    = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/LuPSZYC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Information Extraction}
}

@misc{papaluca2023zero,
  author        = {Andrea Papaluca and Daniel Krefl and Sergio Mendez Rodriguez and Artem Lensky and Hanna Suominen},
  title         = {Zero- and Few-Shots Knowledge Graph Triplet Extraction with Large Language Models},
  year          = {2023},
  eprint        = {2312.01954},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2312.01954},
  keywords      = {Information Extraction}
}

@inproceedings{DBLP:conf/cvpr/TakashimaHIKY23,
  author       = {Sora Takashima and
                  Ryo Hayamizu and
                  Nakamasa Inoue and
                  Hirokatsu Kataoka and
                  Rio Yokota},
  title        = {Visual Atoms: Pre-Training Vision Transformers with Sinusoidal Waves},
  booktitle    = {CVPR},
  pages        = {18579--18588},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.01782},
  doi          = {10.1109/CVPR52729.2023.01782},
  timestamp    = {Tue, 29 Aug 2023 15:44:40 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/TakashimaHIKY23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Vision LLM}
}

@article{DBLP:journals/corr/abs-2304-10592,
  author     = {Deyao Zhu and Jun Chen and Xiaoqian Shen and Xiang Li and Mohamed Elhoseiny},
  title      = {MiniGPT-4: Enhancing Vision-Language Understanding with Advanced Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2304.10592},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2304.10592},
  doi        = {10.48550/ARXIV.2304.10592},
  url        = {https://doi.org/10.48550/arXiv.2304.10592},
  timestamp  = {Sat, 30 Sep 2023 10:10:35 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-10592.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Multimodal}
}

@inproceedings{DBLP:conf/nips/WangCCWZZLLZQD23,
  author    = {Wenhai Wang and Zhe Chen and Xiaokang Chen and Jiannan Wu and Xizhou Zhu and Gang Zeng and Ping Luo and Tong Lu and Jie Zhou and Yu Qiao and Jifeng Dai},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {VisionLLM: Large Language Model is also an Open-Ended Decoder for Vision-Centric Tasks},
  booktitle = {NeurIPS},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/c1f7b1ed763e9c75e4db74b49b76db5f-Abstract-Conference.html},
  timestamp = {Thu, 29 Feb 2024 17:24:41 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/WangCCWZZLLZQD23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Multimodal}
}

@inproceedings{DBLP:conf/emnlp/ChenJYCFHLG23,
  author    = {Zheng Chen and Ziyan Jiang and Fan Yang and Eunah Cho and Xing Fan and Xiaojiang Huang and Yanbin Lu and Aram Galstyan},
  editor    = {Mingxuan Wang and Imed Zitouni},
  title     = {Graph Meets {LLM:} {A} Novel Approach to Collaborative Filtering for Robust Conversational Understanding},
  booktitle = {EMNLP},
  pages     = {811--819},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  url       = {https://aclanthology.org/2023.emnlp-industry.75},
  timestamp = {Fri, 08 Dec 2023 12:36:34 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/ChenJYCFHLG23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Graph Learning}
}

@article{DBLP:journals/corr/abs-2402-05894,
  author     = {Shengxiang Hu and Guobing Zou and Song Yang and Yanglan Gan and Bofeng Zhang and Yixin Chen},
  title      = {Large Language Model Meets Graph Neural Network in Knowledge Distillation},
  journal    = {CoRR},
  volume     = {abs/2402.05894},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2402.05894},
  doi        = {10.48550/ARXIV.2402.05894},
  url        = {https://doi.org/10.48550/arXiv.2402.05894},
  timestamp  = {Fri, 16 Feb 2024 09:43:04 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-05894.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Graph Learning}
}

@misc{yang2024large,
  author        = {Sohee Yang and Elena Gribovskaya and Nora Kassner and Mor Geva and Sebastian Riedel},
  title         = {Do Large Language Models Latently Perform Multi-Hop Reasoning?},
  year          = {2024},
  eprint        = {2402.16837},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2402.16837.pdf},
  keywords      = {Reasoning}
}

@misc{yu2023prophet,
  author        = {Zhou Yu and Xuecheng Ouyang and Zhenwei Shao and Meng Wang and Jun Yu},
  title         = {Prophet: Prompting Large Language Models with Complementary Answer Heuristics for Knowledge-based Visual Question Answering},
  year          = {2023},
  eprint        = {2303.01903},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
  url           = {https://arxiv.org/pdf/2303.01903v3.pdf},
  keywords      = {Question Answering}
}

@misc{wang2023keqing,
  author        = {Chaojie Wang and Yishi Xu and Zhong Peng and Chenxi Zhang and Bo Chen and Xinrun Wang and Lei Feng and Bo An},
  title         = {keqing: knowledge-based question answering is a nature chain-of-thought mentor of LLM},
  year          = {2023},
  eprint        = {2401.00426},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://openreview.net/pdf?id=bQfJLRlfYO},
  keywords      = {Question Answering}
}

@misc{zhuang2024structlm,
  author        = {Alex Zhuang and Ge Zhang and Tianyu Zheng and Xinrun Du and Junjie Wang and Weiming Ren and Stephen W. Huang and Jie Fu and Xiang Yue and Wenhu Chen},
  title         = {StructLM: Towards Building Generalist Models for Structured Knowledge Grounding},
  year          = {2024},
  eprint        = {2402.16671},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2402.16671v2},
  keywords      = {Question Answering}
}

@misc{liang2024aligning,
  author        = {Yuanyuan Liang and Keren Tan and Tingyu Xie and Wenbiao Tao and Siyuan Wang and Yunshi Lan and Weining Qian},
  title         = {Aligning Large Language Models to a Domain-specific Graph Database},
  year          = {2024},
  eprint        = {2402.16567},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {http://export.arxiv.org/abs/2402.16567},
  keywords      = {Question Answering}
}

@misc{besta2024topologies,
      title={Topologies of Reasoning: Demystifying Chains, Trees, and Graphs of Thoughts},
      author={Maciej Besta and Florim Memedi and Zhenyu Zhang and Robert Gerstenberger and Nils Blach and Piotr Nyczyk and Marcin Copik and Grzegorz Kwa{\'s}niewski and J{\"u}rgen M{\"u}ller and Lukas Gianinazzi and Ales Kubicek and Hubert Niewiadomski and Onur Mutlu and Torsten Hoefler},
      year={2024},
      eprint={2401.14295},
      archivePrefix={arXiv},
      primaryClass={cs.CL},
      url = {https://arxiv.org/abs/2401.14295},
      keywords = {Chain of Thought}
}

@inproceedings{10203649,
  author    = {Ye, Shuquan and Xie, Yujia and Chen, Dongdong and Xu, Yichong and Yuan, Lu and Zhu, Chenguang and Liao, Jing},
  title     = {Improving Commonsense in Vision-Language Models via Knowledge Graph Riddles},
  booktitle = {CVPR},
  pages     = {2634--2645},
  year      = {2023},
  doi       = {10.1109/CVPR52729.2023.00259},
  url       = {https://openaccess.thecvf.com/content/CVPR2023/papers/Ye_Improving_Commonsense_in_Vision-Language_Models_via_Knowledge_Graph_Riddles_CVPR_2023_paper.pdf},
  keywords  = {Knowledge Graph Embedding}
}

@misc{rudy2023,
  author   = {Rudy Agovic},
  title    = {Fusing Knowledge Graphs and Large Language Models},
  year     = {2023},
  url      = {https://www.youtube.com/watch?v=RBKHLt3n9rM},
  keywords = {LLM and KG}
}

@misc{Neo4j2023,
  author   = {Neo4j},
  title    = {RAG with a Neo4j Knowledge Graph: How it Works and How to Set It Up},
  year     = {2023},
  url      = {https://www.youtube.com/watch?v=ftlZ0oeXYRE},
  keywords = {LLM and KG}
}

@misc{wang2024infuserki,
  author        = {Fali Wang and Runxue Bao and Suhang Wang and Wenchao Yu and Yanchi Liu and Wei Cheng and Haifeng Chen},
  title         = {InfuserKI: Enhancing Large Language Models with Knowledge Graphs via Infuser-Guided Knowledge Integration},
  year          = {2024},
  eprint        = {2402.11441},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2402.11441.pdf},
  keywords      = {LLM and KG}
}

@article{10417790,
  author   = {Yang, Linyao and Chen, Hongyang and Li, Zhao and Ding, Xiao and Wu, Xindong},
  title    = {Give Us the Facts: Enhancing Large Language Models with Knowledge Graphs for Fact-aware Language Modeling},
  journal  = {IEEE Transactions on Knowledge and Data Engineering},
  pages    = {1--20},
  year     = {2024},
  doi      = {10.1109/TKDE.2024.3360454},
  url      = {https://ieeexplore.ieee.org/abstract/document/10417790},
  keywords = {LLM and KG}
}

@misc{zhang2023making,
  author        = {Yichi Zhang and Zhuo Chen and Wen Zhang and Huajun Chen},
  title         = {Making Large Language Models Perform Better in Knowledge Graph Completion},
  year          = {2023},
  eprint        = {2310.06671},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2310.06671},
  keywords      = {LLM and KG}
}

@misc{microsoft2024,
      title={GraphRAG: Unlocking LLM discovery on narrative private data},
      author={Jonathan Larson and Steven Truitt},
      year={2024},
      url = {https://www.microsoft.com/en-us/research/blog/graphrag-unlocking-llm-discovery-on-narrative-private-data/},
      keywords = {LLM and KG}
}

@inproceedings{li2023graphadapter,
      title={GraphAdapter: Tuning Vision-Language Models With Dual Knowledge Graph},
      author={Xin Li and Dongze Lian and Zhihe Lu and Jiawang Bai and Zhibo Chen and Xinchao Wang},
      booktitle = {NeurIPS},
      year={2024},
      eprint={2309.13625},
      archivePrefix={arXiv},
      primaryClass={cs.CV},
      keywords = {LLM and KG},
      url = {https://openreview.net/pdf?id=YmEDnMynuO}
}

@inproceedings{wang2023learning,
      title={Learning Hierarchical Prompt with Structured Linguistic Knowledge for Vision-Language Models},
      author={Yubin Wang and Xinyang Jiang and De Cheng and Dongsheng Li and Cairong Zhao},
      booktitle = {AAAI},
      year={2024},
      eprint={2312.06323},
      archivePrefix={arXiv},
      primaryClass={cs.CV},
      keywords = {LLM and KG},
      url = {https://arxiv.org/pdf/2312.06323.pdf}
}

@misc{jiang2024unlocking,
  author        = {Xuhui Jiang and Yinghan Shen and Zhichao Shi and Chengjin Xu and Wei Li and Zixuan Li and Jian Guo and Huawei Shen and Yuanzhuo Wang},
  title         = {Unlocking the Power of Large Language Models for Entity Alignment},
  year          = {2024},
  eprint        = {2402.15048},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2402.15048.pdf},
  keywords      = {Knowledge Fusion}
}

@misc{yang2024heads,
  author        = {Linyao Yang and Hongyang Chen and Xiao Wang and Jing Yang and Fei-Yue Wang and Han Liu},
  title         = {Two Heads Are Better Than One: Integrating Knowledge from Knowledge Graphs and Large Language Models for Entity Alignment},
  year          = {2024},
  eprint        = {2401.16960},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2401.16960},
  keywords      = {Knowledge Fusion}
}

@misc{wang2024rat,
  author        = {Zihao Wang and Anji Liu and Haowei Lin and Jiaqi Li and Xiaojian Ma and Yitao Liang},
  title         = {RAT: Retrieval Augmented Thoughts Elicit Context-Aware Reasoning in Long-Horizon Generation},
  year          = {2024},
  eprint        = {2403.05313},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2403.05313},
  keywords      = {Chain of Thought}
}

@misc{bansal2024llm,
  author        = {Rachit Bansal and Bidisha Samanta and Siddharth Dalmia and Nitish Gupta and Shikhar Vashishth and Sriram Ganapathy and Abhishek Bapna and Prateek Jain and Partha Talukdar},
  title         = {LLM Augmented LLMs: Expanding Capabilities through Composition},
  year          = {2024},
  eprint        = {2401.02412},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://openreview.net/pdf?id=jjA4O1vJRz},
  keywords      = {Knowledge Fusion}
}

@misc{xu2024large,
  author        = {Shengzhe Xu and Christo Kurisummoottil Thomas and Omar Hashash and Nikhil Muralidhar and Walid Saad and Naren Ramakrishnan},
  title         = {Large Multi-Modal Models (LMMs) as Universal Foundation Models for AI-Native Wireless Systems},
  year          = {2024},
  eprint        = {2402.01748},
  archivePrefix = {arXiv},
  primaryClass  = {cs.NI},
  url           = {https://arxiv.org/abs/2402.01748},
  keywords      = {Application}
}

@misc{goddard2024arcees,
  author        = {Charles Goddard and Shamane Siriwardhana and Malikeh Ehghaghi and Luke Meyers and Vlad Karpukhin and Brian Benedict and Mark McQuade and Jacob Solawetz},
  title         = {Arcee's MergeKit: A Toolkit for Merging Large Language Models},
  year          = {2024},
  eprint        = {2403.13257},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2403.13257},
  keywords      = {Knowledge Fusion}
}

@misc{yoon2024langbridge,
  author        = {Dongkeun Yoon and Joel Jang and Sungdong Kim and Seungone Kim and Sheikh Shafayat and Minjoon Seo},
  title         = {LangBridge: Multilingual Reasoning Without Multilingual Supervision},
  year          = {2024},
  eprint        = {2401.10695},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2401.10695},
  keywords      = {Knowledge Fusion}
}

@misc{feng2024dont,
  author        = {Shangbin Feng and Weijia Shi and Yike Wang and Wenxuan Ding and Vidhisha Balachandran and Yulia Tsvetkov},
  title         = {Don't Hallucinate, Abstain: Identifying LLM Knowledge Gaps via Multi-LLM Collaboration},
  year          = {2024},
  eprint        = {2402.00367},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2402.00367},
  keywords      = {Knowledge Fusion}
}

@misc{qiao2024autoact,
  author        = {Shuofei Qiao and Ningyu Zhang and Runnan Fang and Yujie Luo and Wangchunshu Zhou and Yuchen Eleanor Jiang and Chengfei Lv and Huajun Chen},
  title         = {AUTOACT: Automatic Agent Learning from Scratch via Self-Planning},
  year          = {2024},
  eprint        = {2401.05268},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2401.05268},
  keywords      = {Agent}
}

@inproceedings{DBLP:conf/nips/LiuLWL23a,
  author    = {Haotian Liu and Chunyuan Li and Qingyang Wu and Yong Jae Lee},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {Visual Instruction Tuning},
  booktitle = {NeurIPS},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/6dcf277ea32ce3288914faf369fe6de0-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/LiuLWL23a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords  = {Instruction Tuning}
}

@inproceedings{DBLP:conf/nips/Dai0LTZW0FH23,
  author       = {Wenliang Dai and
                  Junnan Li and
                  Dongxu Li and
                  Anthony Meng Huat Tiong and
                  Junqi Zhao and
                  Weisheng Wang and
                  Boyang Li and
                  Pascale Fung and
                  Steven C. H. Hoi},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{InstructBLIP:} Towards General-purpose Vision-Language Models with
                  Instruction Tuning},
  booktitle    = {NeurIPS},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/9a6a435e75419a836fe47ab6793623e6-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Dai0LTZW0FH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Instruction Tuning}
}

@article{DBLP:journals/corr/abs-2401-15884,
  author = {Shi{-}Qi Yan and Jia{-}Chen Gu and Yun Zhu and Zhen{-}Hua Ling},
  title = {Corrective Retrieval Augmented Generation},
  journal = {CoRR},
  volume = {abs/2401.15884},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2401.15884},
  doi = {10.48550/ARXIV.2401.15884},
  eprinttype = {arXiv},
  eprint = {2401.15884},
  timestamp = {Tue, 06 Feb 2024 14:15:49 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2401-15884.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Retrieval-Augmented Language Model}
}

@inproceedings{DBLP:conf/emnlp/Jiao0LZOJ023,
  author = {Yizhu Jiao and Ming Zhong and Sha Li and Ruining Zhao and Siru Ouyang and Heng Ji and Jiawei Han},
  editor = {Houda Bouamor and Juan Pino and Kalika Bali},
  title = {Instruct and Extract: Instruction Tuning for On-Demand Information Extraction},
  booktitle = {EMNLP},
  pages = {10030--10051},
  publisher = {Association for Computational Linguistics},
  year = {2023},
  url = {https://aclanthology.org/2023.emnlp-main.620},
  timestamp = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl = {https://dblp.org/rec/conf/emnlp/Jiao0LZOJ023.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}

@inproceedings{DBLP:conf/nips/YangSLZGLS23,
  author       = {Rui Yang and
                  Lin Song and
                  Yanwei Li and
                  Sijie Zhao and
                  Yixiao Ge and
                  Xiu Li and
                  Ying Shan},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{GPT4Tools:} Teaching Large Language Model to Use Tools via Self-instruction},
  booktitle    = {NeurIPS},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/e393677793767624f2821cec8bdd02f1-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 16:26:21 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangSLZGLS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Instruction Tuning}
}

@inproceedings{DBLP:conf/nips/YinWCSLLH0S0SO23,
  author = {Zhenfei Yin and Jiong Wang and Jianjian Cao and Zhelun Shi and Dingning Liu and Mukai Li and Xiaoshui Huang and Zhiyong Wang and Lu Sheng and Lei Bai and Jing Shao and Wanli Ouyang},
  editor = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title = {{LAMM:} Language-Assisted Multi-Modal Instruction-Tuning Dataset, Framework, and Benchmark},
  booktitle = {NeurIPS},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/548a41b9cac6f50dccf7e63e9e1b1b9b-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl = {https://dblp.org/rec/conf/nips/YinWCSLLH0S0SO23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Instruction Tuning}
}

@article{DBLP:journals/corr/abs-2312-01954,
  author = {Andrea Papaluca and Daniel Krefl and Sergio Mendez Rodriguez and Artem Lenskiy and Hanna Suominen},
  title = {Zero- and Few-Shots Knowledge Graph Triplet Extraction with Large Language Models},
  journal = {CoRR},
  volume = {abs/2312.01954},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2312.01954},
  doi = {10.48550/ARXIV.2312.01954},
  eprinttype = {arXiv},
  eprint = {2312.01954},
  timestamp = {Tue, 12 Dec 2023 16:18:22 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2312-01954.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}

@inproceedings{DBLP:conf/emnlp/XieLZZLW23,
  author       = {Tingyu Xie and
                  Qi Li and
                  Jian Zhang and
                  Yan Zhang and
                  Zuozhu Liu and
                  Hongwei Wang},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {Empirical Study of Zero-Shot {NER} with {ChatGPT}},
  booktitle    = {EMNLP},
  pages        = {7935--7956},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.emnlp-main.493},
  timestamp    = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/XieLZZLW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2401-13218,
  author       = {Xinliang Frederick Zhang and
                  Carter Wood Blum and
                  Temma Choji and
                  Shalin Shah and
                  Alakananda Vempala},
  title        = {{ULTRA:} Unleash {LLMs}' Potential for Event Argument Extraction through
                  Hierarchical Modeling and Pair-wise Refinement},
  journal      = {CoRR},
  volume       = {abs/2401.13218},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.13218},
  doi          = {10.48550/ARXIV.2401.13218},
  eprinttype   = {arXiv},
  eprint       = {2401.13218},
  timestamp    = {Mon, 05 Feb 2024 16:06:53 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-13218.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Information Extraction}
}

@misc{heng2024proggen,
  title         = {{ProgGen:} Generating Named Entity Recognition Datasets Step-by-step with Self-Reflexive Large Language Models},
  author        = {Yuzhao Heng and Chunyuan Deng and Yitong Li and Yue Yu and Yinghao Li and Rongzhi Zhang and Chao Zhang},
  year          = {2024},
  eprint        = {2403.11103},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2403.11103.pdf},
  keywords      = {Information Extraction}
}

@misc{li2024simple,
  title         = {A Simple but Effective Approach to Improve Structured Language Model Output for Information Extraction},
  author        = {Yinghao Li and Rampi Ramprasad and Chao Zhang},
  year          = {2024},
  eprint        = {2402.13364},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2402.13364.pdf},
  keywords      = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2402-06861,
  author       = {Yansong Ning and
                  Hao Liu},
  title        = {{UrbanKGent:} {A} Unified Large Language Model Agent Framework for Urban
                  Knowledge Graph Construction},
  journal      = {CoRR},
  volume       = {abs/2402.06861},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.06861},
  doi          = {10.48550/ARXIV.2402.06861},
  eprinttype   = {arXiv},
  eprint       = {2402.06861},
  timestamp    = {Fri, 16 Feb 2024 13:00:19 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-06861.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {LLM and KG}
}


@misc{wu2024visualizationofthought,
  title         = {Visualization-of-Thought Elicits Spatial Reasoning in Large Language Models},
  author        = {Wenshan Wu and Shaoguang Mao and Yadong Zhang and Yan Xia and Li Dong and Lei Cui and Furu Wei},
  year          = {2024},
  eprint        = {2404.03622},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2404.03622},
  keywords      = {Chain of Thought}
}

@misc{xu2023large,
  title         = {Are Large Language Models Really Good Logical Reasoners? A Comprehensive Evaluation and Beyond},
  author        = {Fangzhi Xu and Qika Lin and Jiawei Han and Tianzhe Zhao and Jun Liu and Erik Cambria},
  year          = {2023},
  eprint        = {2306.09841},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2306.09841},
  keywords      = {Symbolic Reasoning}
}

@misc{anonymous2024systematic,
  title    = {Towards Systematic Evaluation of Logical Reasoning Ability of Large Language Models},
  author   = {Anonymous Submission},
  journal  = {ACL},
  year     = {2024},
  url      = {https://openreview.net/pdf?id=1xms2oSsqc},
  keywords = {Symbolic Reasoning}
}

@inproceedings{DBLP:conf/emnlp/XiuX022,
  author       = {Yeliang Xiu and
                  Zhanhao Xiao and
                  Yongmei Liu},
  editor       = {Yoav Goldberg and
                  Zornitsa Kozareva and
                  Yue Zhang},
  title        = {{LogicNMR:} Probing the Non-monotonic Reasoning Ability of Pre-trained
                  Language Models},
  booktitle    = {EMNLP},
  pages        = {3616--3626},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.265},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.265},
  timestamp    = {Thu, 10 Aug 2023 12:35:27 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/XiuX022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Reasoning}
}
@article{DBLP:journals/corr/abs-2402-11140,
  author = {Sijia Chen and Baochun Li and Di Niu},
  title = {Boosting of Thoughts: Trial-and-Error Problem Solving with Large Language Models},
  journal = {CoRR},
  volume = {abs/2402.11140},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2402.11140},
  doi = {10.48550/ARXIV.2402.11140},
  eprinttype = {arXiv},
  eprint = {2402.11140},
  timestamp = {Mon, 26 Feb 2024 16:52:48 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2402-11140.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Chain of Thought}
}

@article{DBLP:journals/corr/abs-2310-04562,
  author = {Mikhail Galkin and Xinyu Yuan and Hesham Mostafa and Jian Tang and Zhaocheng Zhu},
  title = {Towards Foundation Models for Knowledge Graph Reasoning},
  journal = {CoRR},
  volume = {abs/2310.04562},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2310.04562},
  doi = {10.48550/ARXIV.2310.04562},
  eprinttype = {arXiv},
  eprint = {2310.04562},
  timestamp = {Fri, 20 Oct 2023 12:04:38 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2310-04562.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Knowledge Graph Embedding}
}


@article{DBLP:journals/tgdk/PanRKSCDJO0LBMB23,
  author = {Jeff Z. Pan and Simon Razniewski and Jan{-}Christoph Kalo and Sneha Singhania and Jiaoyan Chen and Stefan Dietze and Hajira Jabeen and Janna Omeliyanenko and Wen Zhang and Matteo Lissandrini and Russa Biswas and Gerard de Melo and Angela Bonifati and Edlira Vakaj and Mauro Dragoni and Damien Graux},
  title = {Large Language Models and Knowledge Graphs: Opportunities and Challenges},
  journal = {TGDK},
  volume = {1},
  number = {1},
  pages = {2:1--2:38},
  year = {2023},
  url = {https://doi.org/10.4230/TGDK.1.1.2},
  doi = {10.4230/TGDK.1.1.2},
  timestamp = {Tue, 19 Dec 2023 17:15:12 +0100},
  biburl = {https://dblp.org/rec/journals/tgdk/PanRKSCDJO0LBMB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {LLM and KG}
}

@inproceedings{DBLP:conf/rep4nlp/SinghaniaRW23,
  author = {Sneha Singhania and Simon Razniewski and Gerhard Weikum},
  editor = {Burcu Can and Maximilian Mozes and Samuel Cahyawijaya and Naomi Saphra and Nora Kassner and Shauli Ravfogel and Abhilasha Ravichander and Chen Zhao and Isabelle Augenstein and Anna Rogers and Kyunghyun Cho and Edward Grefenstette and Lena Voita},
  title = {Extracting Multi-valued Relations from Language Models},
  booktitle = {ACL},
  pages = {139--154},
  publisher = {Association for Computational Linguistics},
  year = {2023},
  url = {https://doi.org/10.18653/v1/2023.repl4nlp-1.12},
  doi = {10.18653/V1/2023.REPL4NLP-1.12},
  timestamp = {Thu, 10 Aug 2023 12:36:13 +0200},
  biburl = {https://dblp.org/rec/conf/rep4nlp/SinghaniaRW23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}


@inproceedings{DBLP:conf/emnlp/VeseliRKW23,
  author = {Blerta Veseli and Simon Razniewski and Jan{-}Christoph Kalo and Gerhard Weikum},
  editor = {Houda Bouamor and Juan Pino and Kalika Bali},
  title = {Evaluating the Knowledge Base Completion Potential of {GPT}},
  booktitle = {EMNLP},
  pages = {6432--6443},
  publisher = {Association for Computational Linguistics},
  year = {2023},
  url = {https://doi.org/10.18653/v1/2023.findings-emnlp.426},
  doi = {10.18653/V1/2023.FINDINGS-EMNLP.426},
  timestamp = {Fri, 12 Apr 2024 13:11:38 +0200},
  biburl = {https://dblp.org/rec/conf/emnlp/VeseliRKW23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {LLM and KG}
}

@article{DBLP:journals/corr/abs-2402-14273,
  author = {Qiyuan He and Yizhong Wang and Wenya Wang},
  title = {Can Language Models Act as Knowledge Bases at Scale?},
  journal = {CoRR},
  volume = {abs/2402.14273},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2402.14273},
  doi = {10.48550/ARXIV.2402.14273},
  eprinttype = {arXiv},
  eprint = {2402.14273},
  timestamp = {Fri, 22 Mar 2024 12:19:03 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2402-14273.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {LLM and KG}
}

@inproceedings{DBLP:journals/corr/abs-2311-07914,
  author       = {Garima Agrawal and
                  Tharindu Kumarage and
                  Zeyad Alghami and
                  Huan Liu},
  title        = {Can Knowledge Graphs Reduce Hallucinations in {LLMs}? : {A} Survey},
  booktitle    = {NAACL},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2311.07914},
  doi          = {10.48550/ARXIV.2311.07914},
  eprinttype   = {arXiv},
  eprint       = {2311.07914},
  timestamp    = {Tue, 21 Nov 2023 13:55:21 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-07914.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {LLM and KG}
}

@inproceedings{DBLP:conf/aaai/GuanLL0HH024,
  author = {Xinyan Guan and Yanjiang Liu and Hongyu Lin and Yaojie Lu and Ben He and Xianpei Han and Le Sun},
  editor = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title = {Mitigating Large Language Model Hallucinations via Autonomous Knowledge Graph-Based Retrofitting},
  booktitle = {AAAI},
  pages = {18126--18134},
  publisher = {{AAAI} Press},
  year = {2024},
  url = {https://doi.org/10.1609/aaai.v38i16.29770},
  doi = {10.1609/AAAI.V38I16.29770},
  timestamp = {Tue, 02 Apr 2024 16:32:09 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/GuanLL0HH024.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {LLM and KG}
}

@article{DBLP:journals/corr/abs-2402-17358,
  author       = {Xinyu Lu and
                  Bowen Yu and
                  Yaojie Lu and
                  Hongyu Lin and
                  Haiyang Yu and
                  Le Sun and
                  Xianpei Han and
                  Yongbin Li},
  title        = {{SoFA:} Shielded On-the-fly Alignment via Priority Rule Following},
  journal      = {CoRR},
  volume       = {abs/2402.17358},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.17358},
  doi          = {10.48550/ARXIV.2402.17358},
  eprinttype   = {arXiv},
  eprint       = {2402.17358},
  timestamp    = {Mon, 25 Mar 2024 15:38:17 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-17358.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Symbolic Reasoning}
}


@article{DBLP:journals/corr/abs-2402-18243,
  author = {Mengjie Ren and Boxi Cao and Hongyu Lin and Cao Liu and Xianpei Han and Ke Zeng and Guanglu Wan and Xunliang Cai and Le Sun},
  title = {Learning or Self-aligning? Rethinking Instruction Fine-tuning},
  journal = {CoRR},
  volume = {abs/2402.18243},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2402.18243},
  doi = {10.48550/ARXIV.2402.18243},
  eprinttype = {arXiv},
  eprint = {2402.18243},
  timestamp = {Tue, 26 Mar 2024 10:51:46 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2402-18243.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Instruction Tuning}
}

@inproceedings{DBLP:conf/aaai/ChenQJC24,
  author = {Ruirui Chen and Chengwei Qin and Weifeng Jiang and Dongkyu Choi},
  editor = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title = {Is a Large Language Model a Good Annotator for Event Extraction?},
  booktitle = {AAAI},
  pages = {17772--17780},
  publisher = {{AAAI} Press},
  year = {2024},
  url = {https://doi.org/10.1609/aaai.v38i16.29730},
  doi = {10.1609/AAAI.V38I16.29730},
  timestamp = {Thu, 11 Apr 2024 16:45:45 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/ChenQJC24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2305-13972,
  author = {Chuanyuan Tan and Yuehe Chen and Wenbiao Shao and Wenliang Chen},
  title = {Make a Choice! Knowledge Base Question Answering with In-Context Learning},
  journal = {CoRR},
  volume = {abs/2305.13972},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2305.13972},
  doi = {10.48550/ARXIV.2305.13972},
  eprinttype = {arXiv},
  eprint = {2305.13972},
  timestamp = {Mon, 05 Jun 2023 15:42:15 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2305-13972.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Question Answering}
}

@article{DBLP:journals/corr/abs-2305-01750,
  author = {Tianle Li and Xueguang Ma and Alex Zhuang and Yu Gu and Yu Su and Wenhu Chen},
  title = {Few-shot In-context Learning for Knowledge Base Question Answering},
  journal = {CoRR},
  volume = {abs/2305.01750},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2305.01750},
  doi = {10.48550/ARXIV.2305.01750},
  eprinttype = {arXiv},
  eprint = {2305.01750},
  timestamp = {Tue, 18 Jul 2023 07:50:20 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2305-01750.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Question Answering}
}

@inproceedings{DBLP:conf/aaai/NieZW024,
  author = {Zhijie Nie and Richong Zhang and Zhongyuan Wang and Xudong Liu},
  editor = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title = {Code-Style In-Context Learning for Knowledge-Based Question Answering},
  booktitle = {AAAI},
  pages = {18833--18841},
  publisher = {{AAAI} Press},
  year = {2024},
  url = {https://doi.org/10.1609/aaai.v38i17.29848},
  doi = {10.1609/AAAI.V38I17.29848},
  timestamp = {Tue, 02 Apr 2024 16:32:09 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/NieZW024.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Question Answering}
}


@article{DBLP:journals/corr/abs-2311-02956,
  author = {Yunlong Chen and Yaming Zhang and Jianfei Yu and Li Yang and Rui Xia},
  title = {In-Context Learning for Knowledge Base Question Answering for Unmanned Systems based on Large Language Models},
  journal = {CoRR},
  volume = {abs/2311.02956},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2311.02956},
  doi = {10.48550/ARXIV.2311.02956},
  eprinttype = {arXiv},
  eprint = {2311.02956},
  timestamp = {Wed, 08 Nov 2023 15:46:55 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2311-02956.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Question Answering}
}


@article{DBLP:journals/corr/abs-2310-09158,
  author = {Meiqi Chen and Yubo Ma and Kaitao Song and Yixin Cao and Yan Zhang and Dongsheng Li},
  title = {Learning To Teach Large Language Models Logical Reasoning},
  journal = {CoRR},
  volume = {abs/2310.09158},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2310.09158},
  doi = {10.48550/ARXIV.2310.09158},
  eprinttype = {arXiv},
  eprint = {2310.09158},
  timestamp = {Wed, 10 Apr 2024 15:48:06 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2310-09158.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Symbolic Reasoning}
}

@article{DBLP:journals/corr/abs-2401-16960,
  author = {Linyao Yang and Hongyang Chen and Xiao Wang and Jing Yang and Fei{-}Yue Wang and Han Liu},
  title = {Two Heads Are Better Than One: Integrating Knowledge from Knowledge Graphs and Large Language Models for Entity Alignment},
  journal = {CoRR},
  volume = {abs/2401.16960},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2401.16960},
  doi = {10.48550/ARXIV.2401.16960},
  eprinttype = {arXiv},
  eprint = {2401.16960},
  timestamp = {Tue, 06 Feb 2024 14:15:49 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2401-16960.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Knowledge Fusion}
}


@article{DBLP:journals/corr/abs-2311-14379,
  author = {Xuan Xiao and Jiahang Liu and Zhipeng Wang and Yanmin Zhou and Yong Qi and Qian Cheng and Bin He and Shuo Jiang},
  title = {Robot Learning in the Era of Foundation Models: {A} Survey},
  journal = {CoRR},
  volume = {abs/2311.14379},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2311.14379},
  doi = {10.48550/ARXIV.2311.14379},
  eprinttype = {arXiv},
  eprint = {2311.14379},
  timestamp = {Tue, 02 Jan 2024 21:36:37 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2311-14379.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Application}
}

@article{DBLP:journals/corr/abs-2402-05827,
  author = {Xinbei Ma and Tianjie Ju and Jiyang Qiu and Zhuosheng Zhang and Hai Zhao and Lifeng Liu and Yulong Wang},
  title = {Is it Possible to Edit Large Language Models Robustly?},
  journal = {CoRR},
  volume = {abs/2402.05827},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2402.05827},
  doi = {10.48550/ARXIV.2402.05827},
  eprinttype = {arXiv},
  eprint = {2402.05827},
  timestamp = {Thu, 21 Mar 2024 16:25:22 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2402-05827.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Knowledge Editing}
}

@article{DBLP:journals/corr/abs-2402-04978,
  author = {Yihao Li and Ru Zhang and Jianyi Liu and Gongshen Liu},
  title = {An Enhanced Prompt-Based {LLM} Reasoning Scheme via Knowledge Graph-Integrated Collaboration},
  journal = {CoRR},
  volume = {abs/2402.04978},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2402.04978},
  doi = {10.48550/ARXIV.2402.04978},
  eprinttype = {arXiv},
  eprint = {2402.04978},
  timestamp = {Wed, 14 Feb 2024 16:31:41 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2402-04978.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {LLM and KG}
}

@article{DBLP:journals/corr/abs-2403-15736,
  author       = {Xin Zhang and
                  Tianjie Ju and
                  Huijia Liang and
                  Ying Fu and
                  Qin Zhang},
  title        = {{LLMs} Instruct {LLMs}: An Extraction and Editing Method},
  journal      = {CoRR},
  volume       = {abs/2403.15736},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.15736},
  doi          = {10.48550/ARXIV.2403.15736},
  eprinttype   = {arXiv},
  eprint       = {2403.15736},
  timestamp    = {Tue, 09 Apr 2024 15:12:39 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-15736.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {LLM and KG}
}

@misc{anonymous2024unleashing,
  title    = {Unleashing the Power of Large Language Models in Zero-shot Relation Extraction via Self-Prompting},
  author   = {Anonymous Submission},
  journal  = {ACL},
  year     = {2024},
  url      = {https://openreview.net/pdf?id=HZnVY_PrFN},
  keywords = {Information Extraction}
}

@inproceedings{DBLP:conf/ijcnlp/KimIBHNM23,
  author = {Bosung Kim and Hayate Iso and Nikita Bhutani and Estevam Hruschka and Ndapa Nakashole and Tom M. Mitchell},
  editor = {Jong C. Park and Yuki Arase and Baotian Hu and Wei Lu and Derry Wijaya and Ayu Purwarianti and Adila Alfa Krisnadhi},
  title = {Zero-shot Triplet Extraction by Template Infilling},
  booktitle = {IJCNLP},
  pages = {272--284},
  publisher = {Association for Computational Linguistics},
  year = {2023},
  url = {https://doi.org/10.18653/v1/2023.ijcnlp-main.18},
  doi = {10.18653/V1/2023.IJCNLP-MAIN.18},
  timestamp = {Fri, 12 Apr 2024 13:12:03 +0200},
  biburl = {https://dblp.org/rec/conf/ijcnlp/KimIBHNM23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}

@misc{anonymous2023leap,
  title    = {{LLM} Instruction-Example Adaptive Prompting ({LEAP}) Framework for Clinical Relation Extraction},
  author   = {Anonymous Submission},
  journal  = {medRxiv},
  year     = {2023},
  url      = {https://www.medrxiv.org/content/10.1101/2023.12.15.23300059v1.full.pdf},
  keywords = {Information Extraction}
}

@inproceedings{DBLP:conf/emnlp/Ma0HS23,
  author = {Yubo Ma and Yixin Cao and Yong Hong and Aixin Sun},
  editor = {Houda Bouamor and Juan Pino and Kalika Bali},
  title = {Large Language Model Is Not a Good Few-shot Information Extractor, but a Good Reranker for Hard Samples!},
  booktitle = {EMNLP},
  pages = {10572--10601},
  publisher = {Association for Computational Linguistics},
  year = {2023},
  url = {https://doi.org/10.18653/v1/2023.findings-emnlp.710},
  doi = {10.18653/V1/2023.FINDINGS-EMNLP.710},
  timestamp = {Fri, 12 Apr 2024 13:11:41 +0200},
  biburl = {https://dblp.org/rec/conf/emnlp/Ma0HS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  keywords = {Information Extraction}
}

@misc{zhang2024unified,
  title         = {A Unified Label-Aware Contrastive Learning Framework for Few-Shot Named Entity Recognition},
  author        = {Haojie Zhang and Yimeng Zhuang},
  year          = {2024},
  eprint        = {2404.17178},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2404.17178},
  keywords      = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2402-14568,
  author     = {Junjie Ye and Nuo Xu and Yikun Wang and Jie Zhou and Qi Zhang and Tao Gui and Xuanjing Huang},
  title      = {{LLM-DA:} Data Augmentation via Large Language Models for Few-Shot Named Entity Recognition},
  journal    = {CoRR},
  volume     = {abs/2402.14568},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.14568},
  doi        = {10.48550/ARXIV.2402.14568},
  eprinttype = {arXiv},
  eprint     = {2402.14568},
  timestamp  = {Fri, 22 Mar 2024 12:19:03 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-14568.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@inproceedings{DBLP:conf/emnlp/MaLZ23a,
  author     = {Xilai Ma and Jing Li and Min Zhang},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Chain of Thought with Explicit Evidence Reasoning for Few-shot Relation Extraction},
  booktitle  = {EMNLP},
  pages      = {2334--2352},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-emnlp.153},
  doi        = {10.18653/V1/2023.FINDINGS-EMNLP.153},
  timestamp  = {Fri, 12 Apr 2024 13:11:52 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/MaLZ23a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@article{DBLP:journals/corr/abs-2306-00024,
  author     = {Zelalem Gero and Chandan Singh and Hao Cheng and Tristan Naumann and Michel Galley and Jianfeng Gao and Hoifung Poon},
  title      = {Self-Verification Improves Few-Shot Clinical Information Extraction},
  journal    = {CoRR},
  volume     = {abs/2306.00024},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.00024},
  doi        = {10.48550/ARXIV.2306.00024},
  eprinttype = {arXiv},
  eprint     = {2306.00024},
  timestamp  = {Thu, 11 Apr 2024 13:33:57 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-00024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@misc{munnangi2024onthefly,
  title         = {On-the-fly Definition Augmentation of {LLMs} for Biomedical {NER}},
  author        = {Monica Munnangi and Sergey Feldman and Byron C Wallace and Silvio Amir and Tom Hope and Aakanksha Naik},
  year          = {2024},
  eprint        = {2404.00152},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/pdf/2404.00152},
  keywords      = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2402-12563,
  author     = {Loka Li and Guangyi Chen and Yusheng Su and Zhenhao Chen and Yixuan Zhang and Eric Xing and Kun Zhang},
  title      = {Confidence Matters: Revisiting Intrinsic Self-Correction Capabilities of Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2402.12563},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.12563},
  doi        = {10.48550/ARXIV.2402.12563},
  eprinttype = {arXiv},
  eprint     = {2402.12563},
  timestamp  = {Thu, 21 Mar 2024 15:46:29 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-12563.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}


@inproceedings{DBLP:conf/emnlp/PangCD023,
  author     = {Chaoxu Pang and Yixuan Cao and Qiang Ding and Ping Luo},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Guideline Learning for In-Context Information Extraction},
  booktitle  = {EMNLP},
  pages      = {15372--15389},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.emnlp-main.950},
  doi        = {10.18653/V1/2023.EMNLP-MAIN.950},
  timestamp  = {Fri, 12 Apr 2024 13:11:46 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/PangCD023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2402-18909,
  author     = {Xiaobao Wu and Liangming Pan and William Yang Wang and Anh Tuan Luu},
  title      = {Updating Language Models with Unstructured Facts: Towards Practical Knowledge Editing},
  journal    = {CoRR},
  volume     = {abs/2402.18909},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.18909},
  doi        = {10.48550/ARXIV.2402.18909},
  eprinttype = {arXiv},
  eprint     = {2402.18909},
  timestamp  = {Tue, 26 Mar 2024 10:51:46 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-18909.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}

@article{DBLP:journals/corr/abs-2402-13093,
  author     = {Hao Peng and Xiaozhi Wang and Chunyang Li and Kaisheng Zeng and Jiangshan Duo and Yixin Cao and Lei Hou and Juanzi Li},
  title      = {Event-level Knowledge Editing},
  journal    = {CoRR},
  volume     = {abs/2402.13093},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13093},
  doi        = {10.48550/ARXIV.2402.13093},
  eprinttype = {arXiv},
  eprint     = {2402.13093},
  timestamp  = {Wed, 10 Apr 2024 15:48:06 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Editing}
}

@article{DBLP:journals/corr/abs-2402-13741,
  author     = {Guozheng Li and Wenjun Ke and Peng Wang and Zijie Xu and Ke Ji and Jiajun Liu and Ziyu Shang and Qiqing Luo},
  title      = {Unlocking Instructive In-Context Learning with Tabular Prompting for Relational Triple Extraction},
  journal    = {CoRR},
  volume     = {abs/2402.13741},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13741},
  doi        = {10.48550/ARXIV.2402.13741},
  eprinttype = {arXiv},
  eprint     = {2402.13741},
  timestamp  = {Fri, 22 Mar 2024 12:19:03 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13741.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@misc{li2024meta,
  title         = {Meta In-Context Learning Makes Large Language Models Better Zero and Few-Shot Relation Extractors},
  author        = {Guozheng Li and Peng Wang and Jiajun Liu and Yikai Guo and Ke Ji and Ziyu Shang and Zijie Xu},
  year          = {2024},
  eprint        = {2404.17807},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2404.17807},
  keywords      = {Information Extraction}
}

@inproceedings{DBLP:conf/nips/Coda-FornoBABWS23,
  author     = {Julian Coda{-}Forno and Marcel Binz and Zeynep Akata and Matt M. Botvinick and Jane X. Wang and Eric Schulz},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Meta-in-context learning in large language models},
  booktitle  = {NeurIPS},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/cda04d7ea67ea1376bf8c6962d8541e0-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Coda-FornoBABWS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

@inproceedings{DBLP:conf/aaai/ChenZSHSGG24,
  author     = {Zhenfang Chen and Qinhong Zhou and Yikang Shen and Yining Hong and Zhiqing Sun and Dan Gutfreund and Chuang Gan},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {Visual Chain-of-Thought Prompting for Knowledge-Based Visual Reasoning},
  booktitle  = {AAAI},
  pages      = {1254--1262},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i2.27888},
  doi        = {10.1609/AAAI.V38I2.27888},
  timestamp  = {Tue, 02 Apr 2024 16:32:08 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ChenZSHSGG24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@inproceedings{DBLP:conf/nips/ZhengYTZY23,
  author     = {Ge Zheng and Bin Yang and Jiajin Tang and Hong{-}Yu Zhou and Sibei Yang},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {{DDCoT:} Duty-Distinct Chain-of-Thought Prompting for Multimodal Reasoning in Language Models},
  booktitle  = {NeurIPS},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/108030643e640ac050e0ed5e6aace48f-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 16:26:19 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ZhengYTZY23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


@article{DBLP:journals/corr/abs-2304-07919,
  author     = {Jiaxin Ge and Hongyin Luo and Siyuan Qian and Yulu Gan and Jie Fu and Shanghang Zhang},
  title      = {Chain of Thought Prompt Tuning in Vision Language Models},
  journal    = {CoRR},
  volume     = {abs/2304.07919},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.07919},
  doi        = {10.48550/ARXIV.2304.07919},
  eprinttype = {arXiv},
  eprint     = {2304.07919},
  timestamp  = {Fri, 21 Apr 2023 11:01:56 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-07919.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


@inproceedings{DBLP:conf/aaai/HeZHCXHZLX24,
  author     = {Qianyu He and Jie Zeng and Wenhao Huang and Lina Chen and Jin Xiao and Qianxi He and Xunzhe Zhou and Jiaqing Liang and Yanghua Xiao},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {Can Large Language Models Understand Real-World Complex Instructions?},
  booktitle  = {AAAI},
  pages      = {18188--18196},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i16.29777},
  doi        = {10.1609/AAAI.V38I16.29777},
  timestamp  = {Tue, 02 Apr 2024 16:32:09 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/HeZHCXHZLX24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Instruction Tuning}
}

@inproceedings{DBLP:conf/aaai/LiuZLWLJJXC24,
  author     = {Jingping Liu and Mingchuan Zhang and Weichen Li and Chao Wang and Shuang Li and Haiyun Jiang and Sihang Jiang and Yanghua Xiao and Yunwen Chen},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {Beyond Entities: {A} Large-Scale Multi-Modal Knowledge Graph with Triplet Fact Grounding},
  booktitle  = {AAAI},
  pages      = {18653--18661},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i17.29828},
  doi        = {10.1609/AAAI.V38I17.29828},
  timestamp  = {Tue, 02 Apr 2024 16:32:09 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/LiuZLWLJJXC24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2401-05669,
  author     = {Xintao Wang and Zhouhong Gu and Jiaqing Liang and Dakuan Lu and Yanghua Xiao and Wei Wang},
  title      = {{ConcEPT:} Concept-Enhanced Pre-Training for Language Models},
  journal    = {CoRR},
  volume     = {abs/2401.05669},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.05669},
  doi        = {10.48550/ARXIV.2401.05669},
  eprinttype = {arXiv},
  eprint     = {2401.05669},
  timestamp  = {Thu, 25 Jan 2024 15:41:08 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-05669.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Enhanced}
}


@article{DBLP:journals/corr/abs-2401-11624,
  author     = {Man Luo and Xin Xu and Yue Liu and Panupong Pasupat and Mehran Kazemi},
  title      = {In-context Learning with Retrieved Demonstrations for Language Models: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2401.11624},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.11624},
  doi        = {10.48550/ARXIV.2401.11624},
  eprinttype = {arXiv},
  eprint     = {2401.11624},
  timestamp  = {Mon, 05 Feb 2024 16:06:53 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-11624.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

@article{DBLP:journals/corr/abs-2403-06402,
  author     = {Manish Chandra and Debasis Ganguly and Yiwen Li and Iadh Ounis},
  title      = {'One size doesn't fit all': Learning how many Examples to use for In-Context Learning for Improved Text Classification},
  journal    = {CoRR},
  volume     = {abs/2403.06402},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.06402},
  doi        = {10.48550/ARXIV.2403.06402},
  eprinttype = {arXiv},
  eprint     = {2403.06402},
  timestamp  = {Thu, 04 Apr 2024 15:22:22 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-06402.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}

% Key was previously zhang2024unified, which collided with the Zhang and Zhuang few-shot NER entry earlier in this file.
@misc{parry2024incontext,
  title         = {"In-Context Learning" or: How I learned to stop worrying and love "Applied Information Retrieval"},
  author        = {Andrew Parry and Debasis Ganguly and Manish Chandra},
  year          = {2024},
  eprint        = {2405.01116},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2405.01116},
  keywords      = {In-Context Learning}
}

@inproceedings{DBLP:conf/emnlp/YoussefKLSS23,
  author     = {Paul Youssef and Osman Alperen Koras and Meijie Li and J{\"{o}}rg Schl{\"{o}}tterer and Christin Seifert},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Give Me the Facts! {A} Survey on Factual Knowledge Probing in Pre-trained Language Models},
  booktitle  = {EMNLP},
  pages      = {15588--15605},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-emnlp.1043},
  doi        = {10.18653/V1/2023.FINDINGS-EMNLP.1043},
  timestamp  = {Fri, 12 Apr 2024 13:11:43 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/YoussefKLSS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Language Model as Knowledge Base}
}

@article{DBLP:journals/corr/abs-2402-14373,
  author     = {Xuemei Tang and Jun Wang and Qi Su},
  title      = {Small Language Model Is a Good Guide for Large Language Model in {Chinese} Entity Relation Extraction},
  journal    = {CoRR},
  volume     = {abs/2402.14373},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.14373},
  doi        = {10.48550/ARXIV.2402.14373},
  eprinttype = {arXiv},
  eprint     = {2402.14373},
  timestamp  = {Fri, 22 Mar 2024 12:19:03 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-14373.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@inproceedings{DBLP:conf/aaai/LiMWHJ0X0J24,
  author     = {Yangning Li and Shirong Ma and Xiaobin Wang and Shen Huang and Chengyue Jiang and Haitao Zheng and Pengjun Xie and Fei Huang and Yong Jiang},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {{EcomGPT:} Instruction-Tuning Large Language Models with Chain-of-Task Tasks for E-commerce},
  booktitle  = {AAAI},
  pages      = {18582--18590},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i17.29820},
  doi        = {10.1609/AAAI.V38I17.29820},
  timestamp  = {Tue, 02 Apr 2024 16:32:09 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/LiMWHJ0X0J24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Application}
}

@inproceedings{DBLP:conf/nips/LiSGPO23,
  author     = {Yingcong Li and Kartik Sreenivasan and Angeliki Giannou and Dimitris Papailiopoulos and Samet Oymak},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Dissecting Chain-of-Thought: Compositionality through In-Context Filtering and Learning},
  booktitle  = {NeurIPS},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/45e15bae91a6f213d45e203b8a29be48-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiSGPO23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


@misc{wang2024grokked,
  title         = {Grokked Transformers are Implicit Reasoners: A Mechanistic Journey to the Edge of Generalization},
  author        = {Boshi Wang and Xiang Yue and Yu Su and Huan Sun},
  year          = {2024},
  eprint        = {2405.15071},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2405.15071},
  keywords      = {Symbolic Reasoning}
}

@inproceedings{DBLP:conf/nips/SwaminathanDRSL23,
  author     = {Sivaramakrishnan Swaminathan and Antoine Dedieu and Rajkumar Vasudeva Raju and Murray Shanahan and Miguel L{\'{a}}zaro{-}Gredilla and Dileep George},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Schema-learning and rebinding as mechanisms of in-context learning and emergence},
  booktitle  = {NeurIPS},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/5bc3356e0fa1753fff7e8d6628e71b22-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 16:26:20 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/SwaminathanDRSL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Symbolic Reasoning}
}

@misc{ozyurt2024documentlevel,
  title         = {Document-Level In-Context Few-Shot Relation Extraction via Pre-Trained Language Models},
  author        = {Yilmazcan Ozyurt and Stefan Feuerriegel and Ce Zhang},
  year          = {2024},
  eprint        = {2310.11085},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2310.11085},
  keywords      = {Information Extraction}
}


@article{DBLP:journals/corr/abs-2311-08993,
  author     = {Hao Peng and Xiaozhi Wang and Jianhui Chen and Weikai Li and Yunjia Qi and Zimu Wang and Zhili Wu and Kaisheng Zeng and Bin Xu and Lei Hou and Juanzi Li},
  title      = {When does In-context Learning Fall Short and Why? {A} Study on Specification-Heavy Tasks},
  journal    = {CoRR},
  volume     = {abs/2311.08993},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.08993},
  doi        = {10.48550/ARXIV.2311.08993},
  eprinttype = {arXiv},
  eprint     = {2311.08993},
  timestamp  = {Tue, 07 May 2024 20:16:46 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-08993.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {In-Context Learning}
}


@article{DBLP:journals/corr/abs-2402-18041,
  author     = {Yang Liu and Jiahuan Cao and Chongyu Liu and Kai Ding and Lianwen Jin},
  title      = {Datasets for Large Language Models: {A} Comprehensive Survey},
  journal    = {CoRR},
  volume     = {abs/2402.18041},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.18041},
  doi        = {10.48550/ARXIV.2402.18041},
  eprinttype = {arXiv},
  eprint     = {2402.18041},
  timestamp  = {Tue, 26 Mar 2024 10:51:46 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-18041.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Survey}
}


@article{DBLP:journals/corr/abs-2311-06736,
  author     = {Ying Su and Xiaojin Fu and Mingwen Liu and Zhijiang Guo},
  title      = {Are {LLMs} Rigorous Logical Reasoner? Empowering Natural Language Proof Generation with Contrastive Stepwise Decoding},
  journal    = {CoRR},
  volume     = {abs/2311.06736},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.06736},
  doi        = {10.48550/ARXIV.2311.06736},
  eprinttype = {arXiv},
  eprint     = {2311.06736},
  timestamp  = {Wed, 15 Nov 2023 16:23:10 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-06736.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Symbolic Reasoning}
}


@inproceedings{DBLP:conf/ijcnlp/LyuHSZRWAC23,
  author     = {Qing Lyu and Shreya Havaldar and Adam Stein and Li Zhang and Delip Rao and Eric Wong and Marianna Apidianaki and Chris Callison{-}Burch},
  editor     = {Jong C. Park and Yuki Arase and Baotian Hu and Wei Lu and Derry Wijaya and Ayu Purwarianti and Adila Alfa Krisnadhi},
  title      = {Faithful Chain-of-Thought Reasoning},
  booktitle  = {IJCNLP},
  pages      = {305--329},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.ijcnlp-main.20},
  doi        = {10.18653/V1/2023.IJCNLP-MAIN.20},
  timestamp  = {Fri, 12 Apr 2024 13:12:04 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcnlp/LyuHSZRWAC23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}


@inproceedings{DBLP:conf/emnlp/WeiH0K23,
  author     = {Yanbin Wei and Qiushi Huang and Yu Zhang and James T. Kwok},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {{KICGPT:} Large Language Model with Knowledge in Context for Knowledge Graph Completion},
  booktitle  = {EMNLP},
  pages      = {8667--8683},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-emnlp.580},
  doi        = {10.18653/V1/2023.FINDINGS-EMNLP.580},
  timestamp  = {Fri, 12 Apr 2024 13:11:40 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/WeiH0K23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Graph Embedding}
}

@inproceedings{DBLP:conf/acl/Aly0M20,
  author     = {Rami Aly and Andreas Vlachos and Ryan McDonald},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {Leveraging Type Descriptions for Zero-shot Named Entity Recognition and Classification},
  booktitle  = {ACL},
  pages      = {1516--1528},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.120},
  doi        = {10.18653/V1/2021.ACL-LONG.120},
  timestamp  = {Tue, 07 May 2024 20:08:12 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Aly0M20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Information Extraction}
}

@article{DBLP:journals/corr/abs-2402-17231,
  author     = {Debrup Das and Debopriyo Banerjee and Somak Aditya and Ashish Kulkarni},
  title      = {{MATHSENSEI:} {A} Tool-Augmented Large Language Model for Mathematical Reasoning},
  journal    = {CoRR},
  volume     = {abs/2402.17231},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.17231},
  doi        = {10.48550/ARXIV.2402.17231},
  eprinttype = {arXiv},
  eprint     = {2402.17231},
  timestamp  = {Mon, 25 Mar 2024 15:38:17 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-17231.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Arithmetic Reasoning}
}

@inproceedings{DBLP:conf/esws/SaeedizadeB24,
  author     = {Mohammad Javad Saeedizade and Eva Blomqvist},
  editor     = {Albert Mero{\~{n}}o{-}Pe{\~{n}}uela and Anastasia Dimou and Rapha{\"{e}}l Troncy and Olaf Hartig and Maribel Acosta and Mehwish Alam and Heiko Paulheim and Pasquale Lisena},
  title      = {Navigating Ontology Development with Large Language Models},
  booktitle  = {ESWC},
  series     = {Lecture Notes in Computer Science},
  volume     = {14664},
  pages      = {143--161},
  publisher  = {Springer},
  year       = {2024},
  url        = {https://doi.org/10.1007/978-3-031-60626-7\_8},
  doi        = {10.1007/978-3-031-60626-7\_8},
  timestamp  = {Tue, 18 Jun 2024 09:23:51 +0200},
  biburl     = {https://dblp.org/rec/conf/esws/SaeedizadeB24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Knowledge Graph Embedding}
}

@article{DBLP:journals/corr/abs-2402-11199,
  author     = {Minh{-}Vuong Nguyen and Linhao Luo and Fatemeh Shiri and Dinh Phung and Yuan{-}Fang Li and Thuy{-}Trang Vu and Gholamreza Haffari},
  title      = {Direct Evaluation of Chain-of-Thought in Multi-hop Reasoning with Knowledge Graphs},
  journal    = {CoRR},
  volume     = {abs/2402.11199},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.11199},
  doi        = {10.48550/ARXIV.2402.11199},
  eprinttype = {arXiv},
  eprint     = {2402.11199},
  timestamp  = {Mon, 26 Feb 2024 16:52:48 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-11199.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@misc{chu2024navigateenigmaticlabyrinthsurvey,
  title         = {Navigate through Enigmatic Labyrinth A Survey of Chain of Thought Reasoning: Advances, Frontiers and Future},
  author        = {Zheng Chu and Jingchang Chen and Qianglong Chen and Weijiang Yu and Tao He and Haotian Wang and Weihua Peng and Ming Liu and Bing Qin and Ting Liu},
  year          = {2024},
  eprint        = {2309.15402},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2309.15402},
  keywords      = {Chain of Thought}
}

@inproceedings{DBLP:conf/emnlp/WangLZ23,
  author     = {Jinyuan Wang and Junlong Li and Hai Zhao},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Self-prompted Chain-of-Thought on Large Language Models for Open-domain Multi-hop Reasoning},
  booktitle  = {EMNLP},
  pages      = {2717--2731},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-emnlp.179},
  doi        = {10.18653/V1/2023.FINDINGS-EMNLP.179},
  timestamp  = {Wed, 17 Jul 2024 07:49:06 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/WangLZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

@inproceedings{lin2024prompting,
  title     = {Prompting Few-shot Multi-hop Question Generation via Comprehending Type-aware Semantics},
  author    = {Zefeng Lin and Weidong Chen and Yan Song and Yongdong Zhang},
  booktitle = {NAACL},
  pages     = {3730--3740},
  year      = {2024},
  url       = {https://aclanthology.org/2024.findings-naacl.236.pdf},
  keywords  = {Question Answering}
}

% Findings of EMNLP 2023 paper (the DOI is in the findings-emnlp series),
% so the venue is recorded as Findings rather than the main conference.
@inproceedings{DBLP:conf/emnlp/LiD23,
  author       = {Ruosen Li and
                  Xinya Du},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {Leveraging Structured Information for Explainable Multi-hop Question
                  Answering and Reasoning},
  booktitle    = {Findings of EMNLP},
  pages        = {6779--6789},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-emnlp.452},
  doi          = {10.18653/v1/2023.findings-emnlp.452},
  timestamp    = {Fri, 12 Apr 2024 13:11:45 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LiD23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
  keywords     = {Question Answering}
}


% dblp record for arXiv preprint 2311.11797 (CoRR), tagged "Chain of Thought".
@article{DBLP:journals/corr/abs-2311-11797,
  title      = {Igniting Language Intelligence: The Hitchhiker's Guide From Chain-of-Thought Reasoning to Language Agents},
  author     = {Zhuosheng Zhang and
                Yao Yao and
                Aston Zhang and
                Xiangru Tang and
                Xinbei Ma and
                Zhiwei He and
                Yiming Wang and
                Mark Gerstein and
                Rui Wang and
                Gongshen Liu and
                Hai Zhao},
  journal    = {CoRR},
  volume     = {abs/2311.11797},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2311.11797},
  doi        = {10.48550/ARXIV.2311.11797},
  url        = {https://doi.org/10.48550/arXiv.2311.11797},
  timestamp  = {Thu, 11 Apr 2024 16:45:45 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-11797.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

% dblp record for arXiv preprint 2404.05221 (CoRR), tagged "Chain of Thought".
@article{DBLP:journals/corr/abs-2404-05221,
  title      = {{LLM} Reasoners: New Evaluation, Library, and Analysis of Step-by-Step Reasoning with Large Language Models},
  author     = {Shibo Hao and
                Yi Gu and
                Haotian Luo and
                Tianyang Liu and
                Xiyan Shao and
                Xinyuan Wang and
                Shuhua Xie and
                Haodi Ma and
                Adithya Samavedhi and
                Qiyue Gao and
                Zhen Wang and
                Zhiting Hu},
  journal    = {CoRR},
  volume     = {abs/2404.05221},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2404.05221},
  doi        = {10.48550/ARXIV.2404.05221},
  url        = {https://doi.org/10.48550/arXiv.2404.05221},
  timestamp  = {Wed, 15 May 2024 08:47:08 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-05221.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}

% dblp record for arXiv preprint 2406.05673 (CoRR), tagged "Chain of Thought".
@article{DBLP:journals/corr/abs-2406-05673,
  title      = {Flow of Reasoning: Efficient Training of {LLM} Policy with Divergent Thinking},
  author     = {Fangxu Yu and
                Lai Jiang and
                Haoqiang Kang and
                Shibo Hao and
                Lianhui Qin},
  journal    = {CoRR},
  volume     = {abs/2406.05673},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2406.05673},
  doi        = {10.48550/ARXIV.2406.05673},
  url        = {https://doi.org/10.48550/arXiv.2406.05673},
  timestamp  = {Sat, 13 Jul 2024 22:06:59 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-05673.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  keywords   = {Chain of Thought}
}