Cheng et al. "Preference-Based Policy Iteration: Leveraging Preference Learning for Reinforcement Learning." European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases, 2011. doi:10.1007/978-3-642-23780-5_30
Markdown
[Cheng et al. "Preference-Based Policy Iteration: Leveraging Preference Learning for Reinforcement Learning." European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases, 2011.](https://mlanthology.org/ecmlpkdd/2011/cheng2011ecmlpkdd-preferencebased/) doi:10.1007/978-3-642-23780-5_30
BibTeX
% Conference paper entry; the title is stored in Title Case without whole-title
% bracing so the bibliography style decides casing, and the page range uses `--`.
@inproceedings{cheng2011ecmlpkdd-preferencebased,
  title     = {Preference-Based Policy Iteration: Leveraging Preference Learning for Reinforcement Learning},
  author    = {Cheng, Weiwei and Fürnkranz, Johannes and Hüllermeier, Eyke and Park, Sang-Hyeun},
  booktitle = {European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases},
  year      = {2011},
  pages     = {312--327},
  doi       = {10.1007/978-3-642-23780-5_30},
  url       = {https://mlanthology.org/ecmlpkdd/2011/cheng2011ecmlpkdd-preferencebased/},
}