A Survey on Human Preference Learning for Large Language Models. Jiang, R., Chen, K., Bai, X., He, Z., Li, J., Yang, M., Zhao, T., Nie, L., & Zhang, M. arXiv preprint arXiv:2406.11191, 2024.
bibtex   
% arXiv preprint: the identifier is stored in eprint/archiveprefix, not in a journal field.
@misc{jiang2024survey,
  author        = {Jiang, Ruili and Chen, Kehai and Bai, Xuefeng and He, Zhixuan and Li, Juntao and Yang, Muyun and Zhao, Tiejun and Nie, Liqiang and Zhang, Min},
  title         = {A Survey on Human Preference Learning for Large Language Models},
  year          = {2024},
  eprint        = {2406.11191},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2406.11191},
}

Downloads: 0