% Preprint: typed as misc because no journal is given for this work.
% The arXiv identifier is not recorded here; add eprint fields once known.
@misc{he2025verir1precisefaithfulclaim,
  author       = {He, Qi and Qian, Cheng and Chen, Xiusi and He, Bingxiang and Fung, Yi R. and Ji, Heng},
  title        = {{Veri-R1}: Toward Precise and Faithful Claim Verification via Online Reinforcement Learning},
  howpublished = {arXiv preprint},
  year         = {2025},
}
NeurIPS
ToolRL: Reward is All Tool Learning Needs
Cheng Qian, Emre Can Acikgoz, Qi He, and 5 more authors
% Conference paper: typed as inproceedings so that booktitle (the proceedings
% name) is actually used by the bibliography style.
@inproceedings{qian2025toolrl,
  author    = {Qian, Cheng and Acikgoz, Emre Can and He, Qi and Wang, Hongru and Chen, Xiusi and Hakkani-T{\"u}r, Dilek and Tur, Gokhan and Ji, Heng},
  title     = {{ToolRL}: Reward is All Tool Learning Needs},
  booktitle = {Annual Conference on Neural Information Processing Systems},
  year      = {2025},
}
2024
arXiv
From individual to society: A survey on social simulation driven by large language model-based agents
Xinyi Mou, Xuanwen Ding, Qi He, and 8 more authors
% Preprint: typed as misc because no journal is given for this work.
% The arXiv identifier is not recorded here; add eprint fields once known.
@misc{mou2024individual,
  author       = {Mou, Xinyi and Ding, Xuanwen and He, Qi and Wang, Liang and Liang, Jingcong and Zhang, Xinnong and Sun, Libo and Lin, Jiayu and Zhou, Jie and Huang, Xuanjing and others},
  title        = {From Individual to Society: A Survey on Social Simulation Driven by Large Language Model-Based Agents},
  howpublished = {arXiv preprint},
  year         = {2024},
}