Even-Dar et al. "PAC Bounds for Multi-Armed Bandit and Markov Decision Processes." Annual Conference on Computational Learning Theory, 2002. doi:10.1007/3-540-45435-7_18
Markdown
[Even-Dar et al. "PAC Bounds for Multi-Armed Bandit and Markov Decision Processes." Annual Conference on Computational Learning Theory, 2002.](https://mlanthology.org/colt/2002/evendar2002colt-pac/) doi:10.1007/3-540-45435-7_18
BibTeX
@inproceedings{evendar2002colt-pac,
  title     = {{PAC} Bounds for Multi-Armed Bandit and {Markov} Decision Processes},
  author    = {Even-Dar, Eyal and Mannor, Shie and Mansour, Yishay},
  booktitle = {Annual Conference on Computational Learning Theory},
  year      = {2002},
  pages     = {255--270},
  doi       = {10.1007/3-540-45435-7_18},
  url       = {https://mlanthology.org/colt/2002/evendar2002colt-pac/}
}