This repository contains the source code for the Think-RM website.
If you find Think-RM useful for your work, please cite:
@misc{hong2025thinkrmenablinglonghorizonreasoning,
  title         = {{Think-RM}: Enabling Long-Horizon Reasoning in Generative Reward Models},
  author        = {Hong, Ilgee and Yu, Changlong and Qiu, Liang and Yan, Weixiang and Xu, Zhenghao and Jiang, Haoming and Zhang, Qingru and Lu, Qin and Liu, Xin and Zhang, Chao and Zhao, Tuo},
  year          = {2025},
  eprint        = {2505.16265},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2505.16265},
}
This work is licensed under a Creative Commons Attribution-ShareAlike 4.0 International License.
