Ortner. "Online Regret Bounds for Markov Decision Processes with Deterministic Transitions." International Conference on Algorithmic Learning Theory, 2008. doi:10.1007/978-3-540-87987-9_14
Markdown
[Ortner. "Online Regret Bounds for Markov Decision Processes with Deterministic Transitions." International Conference on Algorithmic Learning Theory, 2008.](https://mlanthology.org/alt/2008/ortner2008alt-online/) doi:10.1007/978-3-540-87987-9_14
BibTeX
@comment{Conference paper by Ronald Ortner. Only the proper noun "Markov" is brace-protected in the title so that bibliography styles may recase the rest.}
@inproceedings{ortner2008alt-online,
  title     = {Online Regret Bounds for {Markov} Decision Processes with Deterministic Transitions},
  author    = {Ortner, Ronald},
  booktitle = {International Conference on Algorithmic Learning Theory},
  year      = {2008},
  pages     = {123--137},
  doi       = {10.1007/978-3-540-87987-9_14},
  url       = {https://mlanthology.org/alt/2008/ortner2008alt-online/},
}