@comment{zhang2023unified: conference paper in Advances in Neural Information Processing Systems, volume 36 (2023).}
@inproceedings{zhang2023unified,
  author    = {Zhang, Zeyu and Su, Yi and Yuan, Hui and Wu, Yiran and Balasubramanian, Rishab and Wu, Qingyun and Wang, Huazheng and Wang, Mengdi},
  title     = {Unified Off-Policy Learning to Rank: a Reinforcement Learning Perspective},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Oh, A. and Naumann, T. and Globerson, A. and Saenko, K. and Hardt, M. and Levine, S.},
  volume    = {36},
  pages     = {19887--19907},
  publisher = {Curran Associates, Inc.},
  year      = {2023},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2023/file/3f1b6e97a5eb3b10e6b0c99b022988eb-Paper-Conference.pdf},
}
Co-authored Publications
AISTATS
LAMP: Extracting Locally Linear Decision Surfaces from LLM World Models
Ryan Chen, Youngmin Ko, Zeyu Zhang, and 5 more authors
@comment{chen2025lamp: arXiv preprint; the eprint identifier matches the id in the url field.}
@misc{chen2025lamp,
  author        = {Chen, Ryan and Ko, Youngmin and Zhang, Zeyu and Cho, Catherine and Chung, Sunny and Giuffré, Mauro and Shung, Dennis L. and Stadie, Bradly C.},
  title         = {{LAMP}: Extracting Locally Linear Decision Surfaces from {LLM} World Models},
  year          = {2025},
  eprint        = {2505.11772},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2505.11772},
}