- HotpotQA code is in `hotpotqa`.
- GQA code is in `gqa`.
@article{rerest,
  author  = {Dou, Zi-Yi and Yang, Cheng-Fu and Wu, Xueqing and Chang, Kai-Wei and Peng, Nanyun},
  title   = {Reflection-Reinforced Self-Training for Language Agents},
  journal = {arXiv preprint},
  year    = {2024},
}