- The HotpotQA code is in `hotpotqa`.
- The GQA code is in `gqa`.

@article{rerest,
  author        = {Dou, Zi-Yi and Yang, Cheng-Fu and Wu, Xueqing and Chang, Kai-Wei and Peng, Nanyun},
  title         = {Reflection-Reinforced Self-Training for Language Agents},
  journal       = {arXiv preprint},
  year          = {2024},
  eprint        = {2406.01495},
  archiveprefix = {arXiv},
}