Fürnkranz et al. "Preference-Based Reinforcement Learning: A Formal Framework and a Policy Iteration Algorithm." Machine Learning, 2012. doi:10.1007/S10994-012-5313-8
Markdown
[Fürnkranz et al. "Preference-Based Reinforcement Learning: A Formal Framework and a Policy Iteration Algorithm." Machine Learning, 2012.](https://mlanthology.org/mlj/2012/furnkranz2012mlj-preferencebased/) doi:10.1007/S10994-012-5313-8
BibTeX
@comment{Journal article record. The page range uses a double hyphen, and the title is single-braced so the bibliography style decides its casing.}
@article{furnkranz2012mlj-preferencebased,
  author  = {Fürnkranz, Johannes and Hüllermeier, Eyke and Cheng, Weiwei and Park, Sang-Hyeun},
  title   = {Preference-Based Reinforcement Learning: A Formal Framework and a Policy Iteration Algorithm},
  journal = {Machine Learning},
  volume  = {89},
  pages   = {123--156},
  year    = {2012},
  doi     = {10.1007/S10994-012-5313-8},
  url     = {https://mlanthology.org/mlj/2012/furnkranz2012mlj-preferencebased/},
}