Tewari and Bartlett. "Bounded Parameter Markov Decision Processes with Average Reward Criterion." Annual Conference on Computational Learning Theory, 2007. doi:10.1007/978-3-540-72927-3_20
Markdown
[Tewari and Bartlett. "Bounded Parameter Markov Decision Processes with Average Reward Criterion." Annual Conference on Computational Learning Theory, 2007.](https://mlanthology.org/colt/2007/tewari2007colt-bounded/) doi:10.1007/978-3-540-72927-3_20
BibTeX
@inproceedings{tewari2007colt-bounded,
  author    = {Tewari, Ambuj and Bartlett, Peter L.},
  title     = {Bounded Parameter {Markov} Decision Processes with Average Reward Criterion},
  booktitle = {Annual Conference on Computational Learning Theory},
  year      = {2007},
  pages     = {263--277},
  doi       = {10.1007/978-3-540-72927-3_20},
  url       = {https://mlanthology.org/colt/2007/tewari2007colt-bounded/}
}